<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Archiving and Interchange DTD v2.3 20070202//EN" "archivearticle.dtd">
<article article-type="systematic-review" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. RNA Res.</journal-id>
<journal-title>Frontiers in RNA Research</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. RNA Res.</abbrev-journal-title>
<issn pub-type="epub">2813-7116</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">1419979</article-id>
<article-id pub-id-type="doi">10.3389/frnar.2024.1419979</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>RNA Research</subject>
<subj-group>
<subject>Systematic Review</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Compilation of resources on subcellular localization of lncRNA</article-title>
<alt-title alt-title-type="left-running-head">Choudhury et al.</alt-title>
<alt-title alt-title-type="right-running-head">
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3389/frnar.2024.1419979">10.3389/frnar.2024.1419979</ext-link>
</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Choudhury</surname>
<given-names>Shubham</given-names>
</name>
<uri xlink:href="https://loop.frontiersin.org/people/990170/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Rathore</surname>
<given-names>Anand Singh</given-names>
</name>
<uri xlink:href="https://loop.frontiersin.org/people/2752670/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Raghava</surname>
<given-names>Gajendra P. S.</given-names>
</name>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/301928/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
</contrib-group>
<aff>
<institution>Department of Computational Biology</institution>, <institution>Indraprastha Institute of Information Technology</institution>, <addr-line>New Delhi</addr-line>, <country>India</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1132483/overview">Alessandro Paolini</ext-link>, Bambino Ges&#xf9; Children&#x2019;s Hospital (IRCCS), Italy</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/374295/overview">Giovannino Silvestri</ext-link>, University of Maryland Medical Center, United States</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2025285/overview">Maxime Wery</ext-link>, Institut Curie, France</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Gajendra P. S. Raghava, <email>raghava@iiitd.ac.in</email>
</corresp>
</author-notes>
<pub-date pub-type="epub">
<day>06</day>
<month>06</month>
<year>2024</year>
</pub-date>
<pub-date pub-type="collection">
<year>2024</year>
</pub-date>
<volume>2</volume>
<elocation-id>1419979</elocation-id>
<history>
<date date-type="received">
<day>19</day>
<month>04</month>
<year>2024</year>
</date>
<date date-type="accepted">
<day>17</day>
<month>05</month>
<year>2024</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2024 Choudhury, Rathore and Raghava.</copyright-statement>
<copyright-year>2024</copyright-year>
<copyright-holder>Choudhury, Rathore and Raghava</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>Long non-coding RNAs (lncRNAs) play a vital role in biological processes, and their dysfunctions lead to a wide range of diseases. Due to advancements in sequencing technology, more than 20,000 lncRNA transcripts have been identified in humans, almost equivalent to coding transcripts. One crucial aspect in annotating lncRNA function is predicting their subcellular localization, which often determines their functional roles within cells. This review aims to cover the experimental techniques, databases, and <italic>in silico</italic> tools developed for identifying subcellular localization. Firstly, we discuss the experimental methods employed to determine the subcellular localization of lncRNAs. These techniques provide valuable insights into the precise cellular compartments where lncRNAs reside. Secondly, we explore the available computational resources and databases contributing to our understanding of lncRNAs, including information on their subcellular localization. These computational methods utilize algorithms and machine learning approaches to predict lncRNA subcellular locations using sequence and structural features. Lastly, we discuss the limitations of existing methodologies, future challenges, and potential applications of subcellular localization prediction for lncRNAs. We highlight the need for further advancements in computational methods and experimental validation to enhance the accuracy and reliability of subcellular localization predictions. To support the scientific community, we have developed a platform called LncInfo, which offers comprehensive information on lncRNAs, including their subcellular localization. This platform aims to consolidate and provide accessible resources to researchers studying lncRNAs and their functional roles (<ext-link ext-link-type="uri" xlink:href="http://webs.iiitd.edu.in/raghava/lncinfo">http://webs.iiitd.edu.in/raghava/lncinfo</ext-link>).</p>
</abstract>
<kwd-group>
<kwd>subcellular localization</kwd>
<kwd>multi-label localization</kwd>
<kwd>lncRNA</kwd>
<kwd>databases</kwd>
<kwd>prediction methods</kwd>
<kwd>experimental techniques</kwd>
</kwd-group>
<contract-num rid="cn001">BT/PR40158/BTIS/137/24/2021</contract-num>
<contract-sponsor id="cn001">Department of Biotechnology, Ministry of Science and Technology, India<named-content content-type="fundref-id">10.13039/501100001407</named-content>
</contract-sponsor>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Non-coding RNA</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1">
<title>1 Introduction</title>
<p>Human genomes contain around 3 billion base pairs, whereas the Human Genome Project (HGP) shows that the human genome contains only 20,000 protein-coding genes. It means only a fraction of the human genome codes for proteins that indicate the role of the non-coding region of the genome (<xref ref-type="bibr" rid="B68">ENCODE Project Consortium, 2012</xref>). Among the non-coding genome transcripts, lncRNA has gained significant interest due to its involvement in biological and disease-related functions of specific genes. The ENCODE and FANTOM projects have provided insights into the mammalian transcriptome and indicate that the genome has a significant number of lncRNAs. One of the major challenges in the postgenomic era is annotating these lncRNAs&#x2019; function. In the past, a significant focus was on protein-coding transcripts. Identifying domains, family classification, subcellular localization, and biological function are the primary aspects of functional annotation of a biological entity.</p>
<p>Subcellular localization forms an integral part of functional annotation because, for lncRNA genes, the ultimate product is RNA. Therefore, lncRNA functions depend on proximity-based RNA physical interactions. Studying lncRNA subcellular localization and its dynamic changes is a crucial step toward elucidating the functions and mechanisms of newly discovered lncRNAs. The specific localization of lncRNAs within subcellular compartments allows them to exert precise regulatory effects on gene expression. Recent reviews have discussed how nuclear-localized lncRNAs, can interact with chromatin, participate in epigenetic modifications that influence transcriptional regulation and chromatin organization, and are crucial for organizing the three-dimensional architecture of the genome, contributing to genome organization, transcriptional regulation, and genome stability (<xref ref-type="bibr" rid="B56">Romero-Barrios et al., 2018</xref>; <xref ref-type="bibr" rid="B54">Pisignano and Ladomery, 2021</xref>; <xref ref-type="bibr" rid="B63">Statello et al., 2021</xref>).</p>
<p>According to the review by <xref ref-type="bibr" rid="B21">Dykes and Emanueli (2017)</xref>, lncRNAs localized to the cytoplasm can be associated with ribonucleoprotein granules, such as P-bodies or stress granules, modulating mRNA stability and translation. In the review by <xref ref-type="bibr" rid="B63">Statello et al. (2021)</xref> they have discussed how specific lncRNAs localize to specialized subcellular domains, such as neuronal dendrites or axons, where they are involved in RNA transport and local translation, impacting synaptic plasticity and neuronal development. LncRNAs also contribute to signaling pathways by localizing to specific cellular compartments, such as the plasma membrane or cytoplasmic signaling bodies, interacting with signaling proteins, acting as scaffolds, or regulating protein localization. In summary, the precise localization of lncRNAs within cells is essential for their regulatory roles in gene expression, cellular trafficking, signaling, and nuclear organization, highlighting their diverse and significant biological importance. Recent studies have identified certain lncRNAs that may have been misannotated, as they possessed short open reading frames (sORFs) (<xref ref-type="bibr" rid="B14">Carlevaro-Fita et al., 2016</xref>; <xref ref-type="bibr" rid="B33">Hartford and Lal, 2020</xref>; <xref ref-type="bibr" rid="B3">Andjus et al., 2024</xref>). Some of these sORFs encode small proteins or micropeptides with a wide array of fundamental biological functions, including cell division, transcription regulation and cell signaling (<xref ref-type="bibr" rid="B15">Chen et al., 2020</xref>; <xref ref-type="bibr" rid="B78">Wei and Guo, 2020</xref>).</p>
<p>Several experimental techniques like fluorescent <italic>in-situ</italic> hybridization (FISH), MS2-system-based techniques, and high-throughput RNA sequencing are used for <italic>in vitro</italic> visualization of mRNA location to trace its subcellular localization (<xref ref-type="bibr" rid="B23">Fagerberg et al., 2014</xref>; <xref ref-type="bibr" rid="B74">Wang et al., 2021</xref>; <xref ref-type="bibr" rid="B85">Zhang et al., 2021</xref>). These methods remain the gold standard for studying the subcellular localization of lncRNAs. These experimental techniques have limitations, including cost, time, and the need for sophisticated instrumentation as discussed by <xref ref-type="bibr" rid="B58">Savulescu et al. (2021)</xref> in their perspective article. FISH-based methods suffer from artifacts when multiplexing is done. Also, the detection efficiency decreases as the number of RNA targets increases in FISH-based methods. Current methods find it hard to balance target number and detection efficiency, highlighting the significant limitations in generating subcellular localization information.</p>
<p>These issues highlight the need to develop computational methods for lncRNA subcellular localization prediction. An extensive repertoire of computational resources has already been developed to help predict the subcellular localization of lncRNA. However, the dataset remains the same, more or less sourced from RNALocate version 1. The number of lncRNA sequences in RNALocate (version 2) has decreased significantly, leaving researchers needing more localization information. Other existing databases harboring localization data must be updated frequently, making them outdated for computational model development.</p>
<p>Few review articles have recently been published discussing the advances in tools designed for predicting lncRNA subcellular localization. Among these, <xref ref-type="bibr" rid="B75">Wang et al. (2021)</xref> published a review on lncRNA subcellular localization prediction tools. They have covered four tools in terms of&#x2014;dataset used, data preprocessing, feature extraction, and algorithm for prediction. Firstly, they provided an overview of all the tools and then described each attribute separately. However, the review by <xref ref-type="bibr" rid="B4">Asim et al. (2021)</xref> has a broader domain&#x2014;covering RNA classification and RNA subcellular localization. Much of the review focuses on the RNA classification tool, as much work has been done in that field. A brief description of the tools designed to predict subcellular localization is provided, and they cover three types of RNA&#x2014;mRNA, miRNA, and lncRNA. In this article, we will complement the information provided in existing reviews by including newer methods. Additionally, we have reviewed all the databases that harbor information on lncRNA subcellular localization.</p>
<p>To consolidate all the information, we collected while writing this review, we have developed a web resource called&#x2014;&#x201c;LncInfo,&#x201d; developed using HTML5 and Apache.</p>
</sec>
<sec id="s2">
<title>2 Existing databases on lncRNA</title>
<p>Due to the rapid growth in lncRNA research, large-scale data is being generated, and this information is annotated correctly and stored in various databases that are designed to aid researchers. Most of the databases were developed post-2015 when there was a surge in high throughput methods for studying lncRNA. A list of the popular databases based on lncRNA is provided in <xref ref-type="table" rid="T1">Table 1</xref>. All the existing databases have been graphically presented in <xref ref-type="fig" rid="F1">Figure 1</xref>.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>An overview of the different classes of databases developed for lncRNA.</p>
</caption>
<graphic xlink:href="frnar-02-1419979-g001.tif"/>
</fig>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>Summary of existing databases on lncRNA.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Database</th>
<th align="left">Brief description</th>
<th align="left">Website link</th>
<th align="left">Reference</th>
<th align="left">Year</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td colspan="5" align="left">General databases</td>
</tr>
<tr>
<td align="left">FANTOM Cat</td>
<td align="left">A database for functional annotation of the mammalian genome</td>
<td align="left">
<ext-link ext-link-type="uri" xlink:href="https://fantom.gsc.riken.jp/cat/">https://fantom.gsc.riken.jp/cat/</ext-link>
</td>
<td align="left">
<xref ref-type="bibr" rid="B35">Hon et al. (2017)</xref>
</td>
<td align="left">2017</td>
</tr>
<tr>
<td align="left">GENCODE</td>
<td align="left">A database that provides comprehensive gene annotation for the human and mouse genome</td>
<td align="left">
<ext-link ext-link-type="uri" xlink:href="https://www.gencodegenes.org/">https://www.gencodegenes.org/</ext-link>
</td>
<td align="left">
<xref ref-type="bibr" rid="B27">Frankish et al. (2019)</xref>
</td>
<td align="left">2022</td>
</tr>
<tr>
<td colspan="5" align="left">Expression databases</td>
</tr>
<tr>
<td align="left">ENCODE</td>
<td align="left">A database of functional annotation based on sequencing data</td>
<td align="left">
<ext-link ext-link-type="uri" xlink:href="https://www.encodeproject.org/">https://www.encodeproject.org/</ext-link>
</td>
<td align="left">
<xref ref-type="bibr" rid="B49">Luo et al. (2020)</xref>
</td>
<td align="left">2018</td>
</tr>
<tr>
<td align="left">lncExpDB</td>
<td align="left">A comprehensive database of experimentally validated lncRNA and circRNA.</td>
<td align="left">
<ext-link ext-link-type="uri" xlink:href="https://ngdc.cncb.ac.cn/lncexpdb/">https://ngdc.cncb.ac.cn/lncexpdb/</ext-link>
</td>
<td align="left">
<xref ref-type="bibr" rid="B45">Li et al. (2021)</xref>
</td>
<td align="left">2021</td>
</tr>
<tr>
<td align="left">LNCbook 2.0</td>
<td align="left">A database long non-coding RNAs and their functions</td>
<td align="left">
<ext-link ext-link-type="uri" xlink:href="https://ngdc.cncb.ac.cn/lncbook/">https://ngdc.cncb.ac.cn/lncbook/</ext-link>
</td>
<td align="left">
<xref ref-type="bibr" rid="B44">Li et al. (2023b)</xref>
</td>
<td align="left">2023</td>
</tr>
<tr>
<td align="left">GTEx</td>
<td align="left">Genotype-Tissue Expression database</td>
<td align="left">
<ext-link ext-link-type="uri" xlink:href="https://gtexportal.org/home/">https://gtexportal.org/home/</ext-link>
</td>
<td align="left">
<xref ref-type="bibr" rid="B35">Hon et al. (2017)</xref>
</td>
<td align="left">2020</td>
</tr>
<tr>
<td align="left">TANRIC</td>
<td align="left">A database of non-coding RNAs in cancer</td>
<td align="left">
<ext-link ext-link-type="uri" xlink:href="https://www.tanric.org/">https://www.tanric.org/</ext-link>
</td>
<td align="left">
<xref ref-type="bibr" rid="B42">Li et al. (2015)</xref>
</td>
<td align="left">2022</td>
</tr>
<tr>
<td align="left">GEO</td>
<td align="left">A public repository for gene expression</td>
<td align="left">
<ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/geo/">https://www.ncbi.nlm.nih.gov/geo/</ext-link>
</td>
<td align="left">
<xref ref-type="bibr" rid="B6">Barrett et al. (2013)</xref>
</td>
<td align="left">2013</td>
</tr>
<tr>
<td colspan="5" align="left">Sequence Annotation</td>
</tr>
<tr>
<td align="left">LNCipedia</td>
<td align="left">A database for lncRNA sequences and their annotation</td>
<td align="left">
<ext-link ext-link-type="uri" xlink:href="https://lncipedia.org/">https://lncipedia.org/</ext-link>
</td>
<td align="left">
<xref ref-type="bibr" rid="B72">Volders et al. (2019)</xref>
</td>
<td align="left">2018</td>
</tr>
<tr>
<td align="left">CANTATAdb</td>
<td align="left">A database of long non-coding RNAs in plants</td>
<td align="left">
<ext-link ext-link-type="uri" xlink:href="http://cantata.amu.edu.pl/">http://cantata.amu.edu.pl/</ext-link>
</td>
<td align="left">
<xref ref-type="bibr" rid="B67">Szcze&#x15b;niak et al. (2019)</xref>
</td>
<td align="left">2019</td>
</tr>
<tr>
<td align="left">RNA Atlas</td>
<td align="left">An atlas of human non-coding RNAs</td>
<td align="left">
<ext-link ext-link-type="uri" xlink:href="http://r2platform.com/rna_atlas">http://r2platform.com/rna_atlas</ext-link>
</td>
<td align="left">
<xref ref-type="bibr" rid="B47">Lorenzi et al. (2021)</xref>
</td>
<td align="left">2021</td>
</tr>
<tr>
<td align="left">NONCODEV6</td>
<td align="left">A database developed to maintain non-coding RNAs and their annotation</td>
<td align="left">
<ext-link ext-link-type="uri" xlink:href="http://www.noncode.org/">http://www.noncode.org/</ext-link>
</td>
<td align="left">
<xref ref-type="bibr" rid="B86">Zhao et al. (2021)</xref>
</td>
<td align="left">2021</td>
</tr>
<tr>
<td align="left">RNACentral</td>
<td align="left">A comprehensive ncRNA sequence collection representing all ncRNA types from a broad range of organisms</td>
<td align="left">
<ext-link ext-link-type="uri" xlink:href="https://rnacentral.org/">https://rnacentral.org/</ext-link>
</td>
<td align="left">
<xref ref-type="bibr" rid="B65">RNAcentral Consortium (2021)</xref>
</td>
<td align="left">2021</td>
</tr>
<tr>
<td align="left">CHESS</td>
<td align="left">A repository that contains human genes and transcripts</td>
<td align="left">
<ext-link ext-link-type="uri" xlink:href="http://ccb.jhu.edu/chess">http://ccb.jhu.edu/chess</ext-link>
</td>
<td align="left">
<xref ref-type="bibr" rid="B53">Pertea et al. (2018)</xref>
</td>
<td align="left">2022</td>
</tr>
<tr>
<td colspan="5" align="left">Subcellular Localization</td>
</tr>
<tr>
<td align="left">LncAtlas</td>
<td align="left">A quantitative resource for lncRNA subcellular localization</td>
<td align="left">
<ext-link ext-link-type="uri" xlink:href="https://lncatlas.crg.eu/">https://lncatlas.crg.eu/</ext-link>
</td>
<td align="left">
<xref ref-type="bibr" rid="B50">Mas-Ponte et al. (2017)</xref>
</td>
<td align="left">2017</td>
</tr>
<tr>
<td align="left">LncSLdb</td>
<td align="left">A manually curated database of RNA subcellular localization</td>
<td align="left">
<ext-link ext-link-type="uri" xlink:href="http://bioinformatics.xidian.edu.cn/lncSLdb">http://bioinformatics.xidian.edu.cn/lncSLdb</ext-link>
</td>
<td align="left">
<xref ref-type="bibr" rid="B79">Wen et al. (2018)</xref>
</td>
<td align="left">2018</td>
</tr>
<tr>
<td align="left">RnaLocate</td>
<td align="left">Curation of RNA subcellular localization from public resources like literature, RNA-seq datasets</td>
<td align="left">
<ext-link ext-link-type="uri" xlink:href="http://www.rna-society.org/rnalocate/">http://www.rna-society.org/rnalocate/</ext-link>
</td>
<td align="left">
<xref ref-type="bibr" rid="B18">Cui et al. (2022)</xref>
</td>
<td align="left">2021</td>
</tr>
<tr>
<td colspan="5" align="left">Disease Association</td>
</tr>
<tr>
<td align="left">LncRNADisease2</td>
<td align="left">A repository that contains lncRNA and associated diseases</td>
<td align="left">
<ext-link ext-link-type="uri" xlink:href="http://www.rnanut.net/lncrnadisease/">http://www.rnanut.net/lncrnadisease/</ext-link>
</td>
<td align="left">
<xref ref-type="bibr" rid="B5">Bao et al. (2019)</xref>
</td>
<td align="left">2019</td>
</tr>
<tr>
<td align="left">Lnc2Cancer v3.0</td>
<td align="left">A resource for experimentally supported lncRNA/circRNA cancer associations</td>
<td align="left">
<ext-link ext-link-type="uri" xlink:href="http://bio-bigdata.hrbmu.edu.cn/lnc2cancer/">http://bio-bigdata.hrbmu.edu.cn/lnc2cancer/</ext-link>
</td>
<td align="left">
<xref ref-type="bibr" rid="B28">Gao et al. (2021)</xref>
</td>
<td align="left">2020</td>
</tr>
</tbody>
</table>
</table-wrap>
<sec id="s2-1">
<title>2.1 General databases</title>
<p>The FANTOM5/CAT project is dedicated to exploring the regulatory landscape of human and mouse genomes by generating comprehensive transcriptomic data (<xref ref-type="bibr" rid="B35">Hon et al., 2017</xref>). Researchers may use this vast collection of transcriptome data from many biological contexts as a valuable tool to study the control of gene expression, transcriptional networks, and functional components of the mammalian genome. GENCODE is dedicated to maintaining protein-coding and non-coding genes (<xref ref-type="bibr" rid="B27">Frankish et al., 2019</xref>). Its main objective is to provide a thorough, current, and accurate annotation of these genomes by locating and describing the protein-coding genes, long non-coding RNAs (lncRNAs), and other functional non-coding RNAs. The annotation provides crucial details for the discovered genes and transcripts, such as gene loci, exon boundaries, coding sequences, untranslated regions (UTRs), and functional and structural annotations. There are now 62,703 genes reported by GENCODE, 19,393 of which are protein-coding and 19,928 long non-coding RNAs. In order to create these annotations, the research combines experimental and computational techniques, including high-throughput sequencing technologies, transcriptome data, protein-coding potential analysis, comparative genomics, and manual curation.</p>
</sec>
<sec id="s2-2">
<title>2.2 Expression databases</title>
<p>The ENCODE is a comprehensive repository of experimental data and metadata generated by the ENCODE project (<xref ref-type="bibr" rid="B49">Luo et al., 2020</xref>). The portal utilizes a standardized metadata architecture that facilitates understanding data in biological terms, enabling the representation of experiments and their analyses. The ENCODE database provides researchers access to a wide range of data, including genomic sequences, epigenetic marks, and transcription factor binding sites. LncExpDB is an expression database focused on human long non-coding RNA (lncRNA) genes (<xref ref-type="bibr" rid="B45">Li et al., 2021</xref>). Its main objective is to provide a wide-ranging collection of expression profiles for lncRNA genes, enabling the exploration of their expression characteristics, capacities, and potential functional significance. The database also aims to establish connections between lncRNAs and protein-coding genes across different biological contexts and conditions. LncBook, an extensive repository of lncRNAs) (<xref ref-type="bibr" rid="B44">Li et al., 2023</xref>), which is widely used in various studies. The updated version, LncBook 2.0, offers significant improvements and enhancements. This resource empowers users to unravel the functional significance of lncRNAs within different biological contexts.</p>
<p>The Genotype-Tissue Expression (GTEx) project is a valuable resource for studying human gene expression, regulation, and its association with genetic variation (<xref ref-type="bibr" rid="B35">Hon et al., 2017</xref>). This initiative involves collecting and analyzing gene expression data from tissues obtained from deceased human donors and their corresponding genotypic information. GTEx is an invaluable resource for researchers investigating the intricate relationship between genetic variation, gene expression, and the specific biology of different tissues. Furthermore, it establishes a valuable foundation for investigating the regulatory mechanisms governing gene expression. TANRIC is a database that maintains cancer-associated lncRNAs mainly extracted from TCGA. The Gene Expression Omnibus (GEO) is a globally accessible public repository that houses functional genomic data sets obtained through high-throughput microarray and next-generation sequencing technologies. These resources are indexed, crosslinked, and made searchable to facilitate easy access and exploration (<xref ref-type="bibr" rid="B6">Barrett et al., 2013</xref>).</p>
</sec>
<sec id="s2-3">
<title>2.3 Sequence annotation</title>
<p>LNCipedia is a database for collecting and annotating human long non-coding RNA (lncRNA) sequences (<xref ref-type="bibr" rid="B72">Volders et al., 2019</xref>). One of its main features is the consolidation of redundant transcripts from various sources, resulting in a consistent and reliable database with grouped transcripts. LNCipedia 5 has expanded its content by incorporating new lncRNAs from resources like FANTOM CAT. It also includes minor improvements, such as an enhanced filtering pipeline and support for official HGNC gene names. CANTATADb 2.0 is a database of LncRNAs that maintain lncRNA from plants and algae species (<xref ref-type="bibr" rid="B67">Szcze&#x15b;niak et al., 2019</xref>). Reads from hundreds of RNA-SEQ libraries were aligned with corresponding plant genomes. Gene prediction software was used to re-annotate plant genomes, and annotation data was used as a reference. NONCODE is a comprehensive database of non-coding RNAs, with a particular emphasis on lncRNAs (<xref ref-type="bibr" rid="B86">Zhao et al., 2021</xref>). The number of lncRNAs in NONCODEV6 has reached 644,510 including 173,112 human lncRNA transcript.</p>
<p>RNAcentral is a state-of-the-art database that consolidates the non-coding sequences of 44 RNA resources, including more than 18 million ncRNA sequences from various organisms (<xref ref-type="bibr" rid="B65">RNAcentral Consortium, 2021</xref>). The new version of RNAcentral also contains the secondary structure of 13 million sequences, making it the world&#x2019;s most extensive 2D structure database. CHESS is an extensive collection of human genes derived from approximately 10,000 RNA sequencing experiments (<xref ref-type="bibr" rid="B53">Pertea et al., 2018</xref>). The database comprises a comprehensive set of genes, encompassing 19,838 protein-coding genes and 17,624 lncRNA) genes. RNA Atlas is an experimentally derived database that advances our understanding of human non-coding RNAs (ncRNAs). By analyzing a diverse set of 300 human samples, including 45 tissues, 162 cell types, and 93 cell lines, researchers have expanded the existing catalog of ncRNAs, identifying a total of 44,428 long non-coding RNAs (lncRNAs). This comprehensive dataset, accessible through the R2 webtool, provides a foundation for further exploration of RNA biology and function (<xref ref-type="bibr" rid="B47">Lorenzi et al., 2021</xref>).</p>
</sec>
<sec id="s2-4">
<title>2.4 Subcellular localization</title>
<p>LncATLAS is a subcellular localization database of lncRNA, where information has been obtained from RNA-sequencing data of human cell-lines (<xref ref-type="bibr" rid="B50">Mas-Ponte et al., 2017</xref>). The RNA-seq datasets were obtained from the ENCODE database. In order to quantify subcellular localization, a measure called relative concentration index (RCI) was introduced. LncSLdb is a specialized database designed to collate and manage qualitative and quantitative information on the subcellular localization of lncRNAs (<xref ref-type="bibr" rid="B79">Wen et al., 2018</xref>). The latest release of LncSLdb encompasses data on more than 11,000 lncRNA transcripts derived from three species (human, mouse, and fruit fly). RNALocate v2.0 is a comprehensive repository of information on RNA subcellular localization. It is compiled from scientific literature, public databases, and RNA sequencing datasets (<xref ref-type="bibr" rid="B18">Cui et al., 2022</xref>). It contains around 200 thousand entries, and each entry provides detailed information about RNA, including their subcellular localization. Additionally, it provides three prediction tools to cater to different user requirements.</p>
</sec>
<sec id="s2-5">
<title>2.5 Disease association</title>
<p>The LncRNADisease2 database is dedicated to maintaining ncRNA-associated diseases, including cancer, cardiovascular diseases, and neurological disorders (<xref ref-type="bibr" rid="B5">Bao et al., 2019</xref>). It contains a collection of experimentally validated lncRNAs linked to specific diseases, detailed annotations on their molecular functions, subcellular localizations, interacting proteins, and experimental evidence. The LncRNADisease database documents 205,959 lncRNA-disease associations and 2,297 lncRNA causative associations. The Lnc2Cancer v3.0 database is a comprehensive resource focusing on experimentally validated associations between lncRNAs and cancers (<xref ref-type="bibr" rid="B28">Gao et al., 2021</xref>). The updated version of Lnc2Cancer includes new features, such as an increased number of cancer-associated lncRNA entries. The database also offers details on microRNAs, transcription factors, genetic variations, methylation, enhancers, and other regulatory mechanisms.</p>
</sec>
</sec>
<sec id="s3">
<title>3 Experimental techniques to investigate subcellular localization</title>
<p>One of the primary aspects of the functional annotation of lncRNA is their subcellular localization. The function of lncRNA heavily depends on its location in cells as it interacts with biological molecules in the exact location of the cell (<xref ref-type="bibr" rid="B58">Savulescu et al., 2021</xref>). In order to investigate subcellular localization, many experimental techniques have been developed. <xref ref-type="fig" rid="F2">Figure 2</xref> provides an overview of all the experimental techniques developed in this regard. Deep-sequencing studies have unveiled numerous long non-coding RNAs (lncRNAs) expressed in mammalian genomes, but most remain poorly understood. Essential aspects such as subcellular localization and absolute abundance in single cells remain largely unknown. Knowledge of lncRNA localization can provide insights into their biological functions, while their abundance is crucial for understanding molecular mechanisms. RNA fluorescence <italic>in situ</italic> hybridization (RNA FISH) has been instrumental in uncovering the localization of specific lncRNAs, but conventional methods lack the sensitivity to detect low-abundance lncRNAs. One of the pioneer subcellular localization experiments where X-inactivation by lncRNA XIST was first studied (<xref ref-type="bibr" rid="B10">Brown et al., 1991</xref>; <xref ref-type="bibr" rid="B8">Brockdorff et al., 1992</xref>), utilized a primitive RNA-FISH method to understand the mechanism of action (<xref ref-type="bibr" rid="B9">Brown et al., 1992</xref>) fully. Previously, it was known that XIST could inactivate one X chromosome in females. However, RNA-FISH explained the same&#x2014;indicating how XIST stays in the nucleus and coats the inactive X-chromosome (<xref ref-type="bibr" rid="B10">Brown et al., 1991</xref>).</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>A graphical representation of the major classes of experimental methods used in lncRNA research.</p>
</caption>
<graphic xlink:href="frnar-02-1419979-g002.tif"/>
</fig>
<p>Further improvement in resolution was achieved when <xref ref-type="bibr" rid="B11">Cabili et al. (2015)</xref> deployed single-molecule RNA-FISH to systematically quantify and categorize the subcellular localization patterns of a representative set of 61 lncRNAs in three different cell types. However, there needs to be a more systematic exploration of lncRNA localization and abundance using these techniques, especially for intergenic lncRNAs (lincRNAs). They observed a wide range of localization patterns, with lncRNAs predominantly localizing to the nucleus. They also found that the low abundance of lncRNAs is not due to a small subset of highly expressing cells and that lncRNAs exhibit similar cell-to-cell heterogeneity as mRNAs.</p>
<p>In this section, we have covered most of the popular experimental techniques. A summary of the existing experimental methods is provided in <xref ref-type="table" rid="T2">Table 2</xref>.</p>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>A summary of the existing experimental techniques to investigate lncRNA.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Methods</th>
<th align="left">Brief description of the method</th>
<th align="left">Pubmed ID</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td colspan="3" align="left">FISH based methods</td>
</tr>
<tr>
<td align="left">smFISH</td>
<td align="left">Experimental technique smFISH (single-molecule FISH) is used for visualization and quantification of RNA molecules in cells</td>
<td align="left">
<xref ref-type="bibr" rid="B25">Femino et al. (1998)</xref>, <xref ref-type="bibr" rid="B55">Raj and Tyagi (2010)</xref>, <xref ref-type="bibr" rid="B48">Lubeck and Cai (2012)</xref>
</td>
</tr>
<tr>
<td align="left">smiFISH</td>
<td align="left">Single molecule inexpensive FISH is easy to uses and flexible techniques used for quantification of RNA molecules in cells</td>
<td align="left">
<xref ref-type="bibr" rid="B70">Tsanov et al. (2016)</xref>
</td>
</tr>
<tr>
<td align="left">SNV FISH</td>
<td align="left">Single nucleotide variant FISH can detect single-base changes in DNA sequences within cells or tissues</td>
<td align="left">
<xref ref-type="bibr" rid="B41">Levesque et al. (2013)</xref>, <xref ref-type="bibr" rid="B66">Symmons et al. (2019)</xref>
</td>
</tr>
<tr>
<td align="left">inoFISH</td>
<td align="left">inosine FISH allow one to visualize and quantify adenosine-to-inosine edited transcripts <italic>in situ</italic>
</td>
<td align="left">
<xref ref-type="bibr" rid="B51">Mellis et al. (2017)</xref>
</td>
</tr>
<tr>
<td align="left">SABER-FISH</td>
<td align="left">Signal amplification by exchange reaction FISH uses a hybridization-based signal amplification to detect low-abundance RNA targets in cells and tissues</td>
<td align="left">
<xref ref-type="bibr" rid="B39">Kishi et al. (2019)</xref>
</td>
</tr>
<tr>
<td align="left">ClampFISH</td>
<td align="left">Click-amplifying FISH is a improved version of FISH, which have high specificity and signal amplification</td>
<td align="left">
<xref ref-type="bibr" rid="B57">Rouhanifard et al. (2018)</xref>
</td>
</tr>
<tr>
<td align="left">seqFISH&#x2b;</td>
<td align="left">Spatially resolved transcriptomics by FISH enables simultaneous detection of thousands of RNA molecules <italic>in situ</italic>
</td>
<td align="left">
<xref ref-type="bibr" rid="B22">Eng et al. (2019)</xref>
</td>
</tr>
<tr>
<td align="left">MERFISH</td>
<td align="left">Multiplexed Error-Robust FISH can detect and localize thousands of RNA molecules simultaneously within cells</td>
<td align="left">
<xref ref-type="bibr" rid="B16">Chen et al. (2015)</xref>, <xref ref-type="bibr" rid="B80">Xia et al. (2019)</xref>
</td>
</tr>
<tr>
<td colspan="3" align="left">Imaging based biochemical methods</td>
</tr>
<tr>
<td align="left">STARmap</td>
<td align="left">STARmap is hybrid technique that combines hydrogel-tissue chemistry and DNA sequencing to detect expression of genes</td>
<td align="left">
<xref ref-type="bibr" rid="B76">Wang et al. (2018)</xref>
</td>
</tr>
<tr>
<td align="left">HyblSS</td>
<td align="left">Hybridization-based <italic>in situ</italic> sequencing combines <italic>in situ</italic> hybridization with DNA sequencing to identify RNA molecules at the single-cell level</td>
<td align="left">
<xref ref-type="bibr" rid="B32">Gyllborg et al. (2020)</xref>
</td>
</tr>
<tr>
<td align="left">FISSEQ</td>
<td align="left">Fluorescent <italic>In Situ</italic> Sequencing combines FISH with next generation sequencing for detecting RNA molecules</td>
<td align="left">
<xref ref-type="bibr" rid="B40">Lee et al. (2015)</xref>
</td>
</tr>
<tr>
<td align="left">RNA stem-loop system</td>
<td align="left">The RNA stem-loop system developed for controlled expression of RNA molecules in cells by using a stem-loop structure</td>
<td align="left">
<xref ref-type="bibr" rid="B34">Heinrich et al. (2017)</xref>
</td>
</tr>
<tr>
<td align="left">Cas system</td>
<td align="left">CRISPR-mediated RNA imaging technique involves the use of a modified CRISPR-Cas system to target RNA molecules</td>
<td align="left">
<xref ref-type="bibr" rid="B1">Abudayyeh et al. (2017)</xref>, <xref ref-type="bibr" rid="B17">Chen et al. (2020b)</xref>
</td>
</tr>
<tr>
<td colspan="3" align="left">lncRNA profiling</td>
</tr>
<tr>
<td align="left">RNA-seq</td>
<td align="left">RNA sequencing is a next generation sequencing technology that can be used to sequence lncRNA in a given cell location</td>
<td align="left">
<xref ref-type="bibr" rid="B77">Wang et al. (2009)</xref>
</td>
</tr>
<tr>
<td align="left">Microarray</td>
<td align="left">Microarray RNA profiling is a commonly used technique for measuring expression RNA transcripts</td>
<td align="left">
<xref ref-type="bibr" rid="B60">Schena et al. (1995)</xref>
</td>
</tr>
<tr>
<td align="left">Tiling arrays</td>
<td align="left">Tiling arrays are used to determine genome binding in ChIP assays or to identify transcribed regions</td>
<td align="left">
<xref ref-type="bibr" rid="B7">Bertone et al. (2004)</xref>
</td>
</tr>
<tr>
<td align="left">SAGE CAGE</td>
<td align="left">Cap analysis gene expression, is an extension of SAGE, used for quantifying transcripts including lncRNA</td>
<td align="left">
<xref ref-type="bibr" rid="B71">Velculescu et al. (1995)</xref>, <xref ref-type="bibr" rid="B61">Shiraki et al. (2003)</xref>
</td>
</tr>
<tr>
<td align="left">PARE</td>
<td align="left">Parallel Analysis of RNA Ends allows one to quantify RNA molecules in a sample</td>
<td align="left">
<xref ref-type="bibr" rid="B30">German et al. (2009)</xref>
</td>
</tr>
<tr>
<td align="left">GRO-seq</td>
<td align="left">GRO-seq (Global Run-On sequencing) is a method used to study transcriptional activity of the genome at a global scale</td>
<td align="left">
<xref ref-type="bibr" rid="B29">Gardini (2017)</xref>
</td>
</tr>
<tr>
<td align="left">RIP-Chip</td>
<td align="left">RIP-Chip developed for measuring interaction between RNA and proteins</td>
<td align="left">
<xref ref-type="bibr" rid="B38">Keene et al. (2006)</xref>
</td>
</tr>
<tr>
<td align="left">TIF-seq</td>
<td align="left">Transcription initiation footprinting and sequencing is used to study the initiation of transcription in a genome</td>
<td align="left">
<xref ref-type="bibr" rid="B52">Pelechano et al. (2013)</xref>
</td>
</tr>
<tr>
<td align="left">SHAPE</td>
<td align="left">Selective 2&#x2032;-hydroxyl acylation by primer extension is a high-resolution technique to measure RNA structure</td>
<td align="left">
<xref ref-type="bibr" rid="B62">Smola et al. (2015)</xref>
</td>
</tr>
<tr>
<td align="left">PARS</td>
<td align="left">Parallel Analysis of RNA Structure allow to study structure and function of wide range of RNAs at genome scale</td>
<td align="left">
<xref ref-type="bibr" rid="B73">Wan et al. (2013)</xref>
</td>
</tr>
<tr>
<td colspan="3" align="left" >Biochemical methods</td>
</tr>
<tr>
<td align="left">APEX-RIP</td>
<td align="left">Ascorbate Peroxidase Proximity-Dependent Biotinylation RIP allow to identify RNA-protein interactions at genome scale</td>
<td align="left">
<xref ref-type="bibr" rid="B37">Kaewsapsak et al. (2017)</xref>
</td>
</tr>
<tr>
<td align="left">Biochemical Fractionation &#x2b; RNA-Seq</td>
<td align="left">It is a powerful experimental method for subcellular localization of RNA molecules</td>
<td align="left">
<xref ref-type="bibr" rid="B69">Tilgner et al. (2012)</xref>
</td>
</tr>
</tbody>
</table>
</table-wrap>
<sec id="s3-1">
<title>3.1 FISH-based methods</title>
<p>Fluorescence <italic>In Situ</italic> Hybridization (FISH) is a molecular cytogenetic technique commonly used to identify the location of biological molecules like DNA and entire chromosomes in a cell. One of the significant features of FISH is that it allows the detection of many biological molecules simultaneously. Single-molecule FISH (smFISH) is a modified version of FISH for single-cell resolution. It allows for visualizing the localization and abundance of individual RNA molecules within cells or tissues (<xref ref-type="bibr" rid="B25">Femino et al., 1998</xref>; <xref ref-type="bibr" rid="B55">Raj and Tyagi, 2010</xref>; <xref ref-type="bibr" rid="B48">Lubeck and Cai, 2012</xref>). In smFISH, RNA molecules are hybridized with fluorescently labeled probes to generate a fluorescent signal that can be detected using fluorescence microscopy. Single Molecule Inexpensive FISH (smiFISH) is a user-friendly and versatile approach for visualizing and quantifying RNA. It uses fluorescently tagged secondary detector oligonucleotides and unlabeled primary probes (<xref ref-type="bibr" rid="B70">Tsanov et al., 2016</xref>). The primary probes, which are gene-specific, are unlabeled, making them cost-effective to synthesize. This cost advantage allows for using more probes per mRNA, significantly improving detection efficiency. Single-nucleotide variant FISH (SNV-FISH) is a highly sophisticated method that detects single-nucleotide variations in an RNA transcript (<xref ref-type="bibr" rid="B41">Levesque et al., 2013</xref>; <xref ref-type="bibr" rid="B66">Symmons et al., 2019</xref>). One more variety of FISH is inosineFISH or inoFISH, which capture image of adenosine-to-inosine RNA altering occasions with single-particle resolution (<xref ref-type="bibr" rid="B51">Mellis et al., 2017</xref>).</p>
<p>SABER, an acronym for signal amplification by exchange reaction, is a technique that enhances the signals obtained from oligonucleotide-based FISH probes by attaching long, single-stranded DNA chains (<xref ref-type="bibr" rid="B39">Kishi et al., 2019</xref>). It can amplify RNA/DNA signals in cells and tissues. Click-amplifying FISH is a precise method that achieves remarkable signal amplification with a high gain (<xref ref-type="bibr" rid="B57">Rouhanifard et al., 2018</xref>). It allows the detection of RNA species using low-magnification microscopy and RNA-based flow cytometry. Sequential FISH (seqFISH) is an advanced technology that identifies thousands of molecules within single cells while preserving their spatial context (<xref ref-type="bibr" rid="B22">Eng et al., 2019</xref>). SeqFISH allows researchers to obtain super-resolved images that provide insights into genomic-level processes with exceptionally high efficiency and accuracy. Multiplexed error-robust FISH (MERFISH) is a powerful single-molecule imaging technique developed for determining copy numbers of thousands of RNA molecules (<xref ref-type="bibr" rid="B16">Chen et al., 2015</xref>; <xref ref-type="bibr" rid="B80">Xia et al., 2019</xref>). It revolutionizes transcriptome-scale RNA imaging at the single-cell level by utilizing error-robust barcodes to encode individual RNA species. Notably, the MERFISH protocol has undergone updates to enhance detection efficiency, allowing the transcriptome-scale imaging of approximately 1,000 RNA species in single cells.</p>
</sec>
<sec id="s3-2">
<title>3.2 Imaging based biochemical methods</title>
<p>STARmap is a novel approach that allow to measure gene expression at single cell compartment in intact tissue, providing insights into the activity of over a thousand genes (<xref ref-type="bibr" rid="B76">Wang et al., 2018</xref>). In the future, integrating this intact-system gene expression measurement with complementary methodologies will offer cellular-resolution analysis. One of the powerful technologies in this category is <italic>in situ</italic> sequencing (ISS), which utilizes padlock probes and rolling circle amplification. An enhanced version of ISS, known as HybISS (hybridization-based <italic>in situ</italic> sequencing), has been developed to improve the spatial detection of RNA transcripts (<xref ref-type="bibr" rid="B32">Gyllborg et al., 2020</xref>). HybISS incorporates modifications in probe design, enabling a new barcoding system through sequence-by-hybridization chemistry. The HybISS design offers increased flexibility, allowing for enhanced multiplexing and improved signal-to-noise ratio, all while maintaining the efficiency required for imaging large fields of view. Fluorescent <italic>In Situ</italic> Sequencing (FISSEQ) is a molecular technique that allows the simultaneous visualization of RNA molecules and their sequences in intact biological samples (<xref ref-type="bibr" rid="B40">Lee et al., 2015</xref>). FISSEQ uses barcoded oligonucleotide probes to hybridize targeted RNA molecules. These probes are amplified and labeled with fluorescent dyes, allowing the visualization of the RNA molecules. In the widely adopted RNA labeling method, query RNA molecule is labeled with a specific stem-loop. This stem-loop sequence binds to the bacteriophage coat protein and fused to a fluorescent protein that enables the visualization of the labeled RNA using fluorescence microscopy (<xref ref-type="bibr" rid="B34">Heinrich et al., 2017</xref>). Using CRISPR-Cas based RNA imaging, which offers target programmability without genetically altering the target, it is possible to track a variety of endogenous long-chain RNAs (like mRNA) in live cells in real-time (<xref ref-type="bibr" rid="B1">Abudayyeh et al., 2017</xref>; <xref ref-type="bibr" rid="B17">Chen et al., 2020</xref>). The CRISPR-mediated RNA imaging technique involves the use of a modified CRISPR-Cas system that targets specific RNA molecules and recruit fluorescent proteins.</p>
</sec>
<sec id="s3-3">
<title>3.3 RNA-seq based techniques</title>
<p>In the last decade, RNA sequencing (RNA-seq) has been heavily used for a wide range of omics, including a comprehensive analysis of gene expression and sequencing of the transcriptome. It now encompasses various methods that enable the investigation of diverse aspects of RNA biology. Furthermore, the advent of long-read sequencing and direct RNA-seq technologies, coupled with improved computational tools for data analysis, has revolutionized RNA-seq (<xref ref-type="bibr" rid="B77">Wang et al., 2009</xref>). In contrast to classical sequencing technologies, RNA-Seq offers superior coverage and enhanced resolution. Microarray RNA profiling is an older technique that allows the simultaneous detection and quantification of thousands of RNA transcripts in a single experiment (<xref ref-type="bibr" rid="B60">Schena et al., 1995</xref>). This procedure has limitations, including its reliance on pre-designed probes, which may not detect all RNA transcripts. A tiling array consists of short nucleic acid fragments fixed onto a substrate (<xref ref-type="bibr" rid="B7">Bertone et al., 2004</xref>). These arrays are specifically designed to cover the entire genome of the target species. Tiling arrays are widely utilized in various applications, such as ChIP assays, to determine genome binding or to identify transcribed regions. By employing tiling arrays, researchers can obtain valuable insights into the binding patterns of the genome in ChIP assays.</p>
<p>Serial analysis of gene expression (SAGE) is a well-established technique developed to study the transcriptome by identifying and quantifying transcripts, including non-coding RNAs (ncRNAs) (<xref ref-type="bibr" rid="B71">Velculescu et al., 1995</xref>). This method relies on restriction enzymes to generate short, unbiased cDNA sequences known as SAGE tags. It involves several steps, including isolating and converting mRNA into cDNA, cutting the cDNA into smaller fragments, and adding tags to each fragment. The fragments are then combined and sequenced, providing information about which genes are present and how many copies of each gene are being expressed. The limited length of the sequence tags in SAGE may need to provide more information to accurately determine the identity of a new sequence. To address this limitation, a modified version of SAGE that utilizes more extended tags has been developed, demonstrating increased usefulness in transcript identification. Cap analysis gene expression (CAGE) provides information about transcript abundance and promoter identification (<xref ref-type="bibr" rid="B61">Shiraki et al., 2003</xref>). It is a high throughput method that can identify and quantify 5&#x2032; ends of capped RNAs. It has been used for study of RNA subcellular localization (<xref ref-type="bibr" rid="B20">Djebali et al., 2012</xref>) and identification of transcription start sites (<xref ref-type="bibr" rid="B68">ENCODE Project Consortium, 2012</xref>). The PARE is another technology used to identify and quantify small RNA molecules in a sample (<xref ref-type="bibr" rid="B30">German et al., 2009</xref>). PARE works by capturing the 5&#x2032; ends of RNA fragments using a technique called ligation-mediated PCR. It is often used to study the targets and functions of miRNAs.</p>
<p>GRO-seq was developed to study the transcriptional activity of the genome at a global scale. It works by labeling nascent RNA transcripts using BrUTP (bromouridine triphosphate) and isolating and sequencing the labeled RNA molecules (<xref ref-type="bibr" rid="B29">Gardini, 2017</xref>). This method allows researchers to identify the specific genomic regions where transcription occurs and the direction and rate of transcription. GRO-seq is often used to study gene expression regulation and identify novel non-coding RNAs.</p>
<p>RIP-Chip is used for isolating and sequencing RNA transcripts that bind to RNA-binding proteins (<xref ref-type="bibr" rid="B38">Keene et al., 2006</xref>). Various downstream methods, such as high-throughput sequencing, characterize the RNA molecules associated with the RNA binding proteins. RIP is often used to study post-transcriptional regulation of gene expression, particularly the regulation of mRNA stability and translation. Transcript IsoForm Sequencing (TIF-Seq) is a powerful technology that has been used to study transcript isoforms at the genome scale (<xref ref-type="bibr" rid="B52">Pelechano et al., 2013</xref>). In TIF-Seq, both the 5&#x2032; and 3&#x2032; ends are simultaneously sequenced and it allows the user to accurately determine the stand and end sites of individual RNA molecules. Selective 2&#x2032;-hydroxyl acylation analyzed by primer extension (SHAPE) was developed to study the structure and folding of RNA molecules at single nucleotide resolution (<xref ref-type="bibr" rid="B62">Smola et al., 2015</xref>). SHAPE experiments use the reactivity of the RNA ribose 2&#x2032;-OH towards hydroxyl-selective electrophilic reagents to model the secondary and tertiary structure of RNA molecules. PARS is another method for studying RNA structure and folding (<xref ref-type="bibr" rid="B73">Wan et al., 2013</xref>).</p>
</sec>
<sec id="s3-4">
<title>3.4 Biochemical methods</title>
<p>APEX-RIP allows the identification of RNA-protein interactions by combining two techniques: APEX (Ascorbate Peroxidase-mediated Protein Localization and Protein-Protein Interaction Profiling) and RIP (RNA Immunoprecipitation) (<xref ref-type="bibr" rid="B37">Kaewsapsak et al., 2017</xref>). APEX-RIP has been used to identify RNA-binding proteins and their associated RNAs in a variety of systems, including cancer cells, neuronal cells, and embryonic stem cells. Biochemical fractionation is a technique used to isolate specific cellular components or organelles from complex mixtures such as whole cells or tissues. The distribution and expression of RNA molecules in different subcellular fractions is studied by combining biochemical fractionation and RNA-seq (<xref ref-type="bibr" rid="B69">Tilgner et al., 2012</xref>). By fractionating cells or tissues into different organelles or subcellular compartments, researchers can isolate RNAs that are localized or enriched in specific cell regions. This approach has been used to study various aspects of RNA biology, including RNA localization.</p>
</sec>
</sec>
<sec id="s4">
<title>4 Creation of datasets by different tools</title>
<p>Majority of the datasets used by the tools are derived from RNALocate or ENCODE RNA-seq data. An overview of datasets published by existing methods has been provided in <xref ref-type="table" rid="T3">Table 3</xref>.</p>
<table-wrap id="T3" position="float">
<label>TABLE 3</label>
<caption>
<p>Summary of datasets used in existing subcellular localization tools.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Tools</th>
<th align="left"/>
<th align="right">Cytoplasm</th>
<th align="right">Cytosol</th>
<th align="right">Exosome</th>
<th align="right">Nucleus</th>
<th align="right">Ribosome</th>
<th align="right">Total</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">lncLocator</td>
<td align="left">Benchmark</td>
<td align="right">301</td>
<td align="right">91</td>
<td align="right">25</td>
<td align="right">152</td>
<td align="right">43</td>
<td align="right">612</td>
</tr>
<tr>
<td align="left">iLoc-lncRNA</td>
<td align="left">Benchmark</td>
<td align="right">426</td>
<td align="left"/>
<td align="right">30</td>
<td align="right">156</td>
<td align="right">43</td>
<td align="right">655</td>
</tr>
<tr>
<td align="left">DeepLncRNA</td>
<td align="left">Benchmark</td>
<td align="left"/>
<td align="right">4,380</td>
<td align="left"/>
<td align="right">4,298</td>
<td align="left"/>
<td align="right">8,678</td>
</tr>
<tr>
<td align="left">LncLocation</td>
<td align="left">Benchmark</td>
<td align="right">426</td>
<td align="left"/>
<td align="right">240</td>
<td align="right">344</td>
<td align="right">314</td>
<td align="right">1,324</td>
</tr>
<tr>
<td align="left">Locate-R</td>
<td align="left">Benchmark</td>
<td align="right">426</td>
<td align="left"/>
<td align="right">240</td>
<td align="right">314</td>
<td align="right">344</td>
<td align="right">1,324</td>
</tr>
<tr>
<td rowspan="2" align="left">lncLocPred</td>
<td align="left">Benchmark</td>
<td align="right">426</td>
<td align="left"/>
<td align="right">30</td>
<td align="right">156</td>
<td align="right">43</td>
<td align="right">655</td>
</tr>
<tr>
<td align="left">Independent</td>
<td align="right">199</td>
<td align="left"/>
<td align="right">16</td>
<td align="right">82</td>
<td align="right">99</td>
<td align="right">396</td>
</tr>
<tr>
<td rowspan="2" align="left">KD-KLNMF</td>
<td align="left">Benchmark</td>
<td align="right">417</td>
<td align="left"/>
<td align="right">417</td>
<td align="right">417</td>
<td align="right">417</td>
<td align="right">1,668</td>
</tr>
<tr>
<td align="left">Independent</td>
<td align="right">14</td>
<td align="left"/>
<td align="right">35</td>
<td align="right">45</td>
<td align="right">84</td>
<td align="right">178</td>
</tr>
<tr>
<td rowspan="2" align="left">DeepLncLoc</td>
<td align="left">Benchmark</td>
<td align="right">328</td>
<td align="right">88</td>
<td align="right">28</td>
<td align="right">325</td>
<td align="right">88</td>
<td align="right">857</td>
</tr>
<tr>
<td align="left">Test</td>
<td align="right">20</td>
<td align="right">10</td>
<td align="right">7</td>
<td align="right">20</td>
<td align="right">10</td>
<td align="right">67</td>
</tr>
<tr>
<td rowspan="3" align="left">GM-lncLoc</td>
<td align="left">Dataset1</td>
<td align="right">292</td>
<td align="right">292</td>
<td align="right">292</td>
<td align="right">292</td>
<td align="right">292</td>
<td align="right">1,460</td>
</tr>
<tr>
<td align="left">Dataset2</td>
<td align="right">417</td>
<td align="left"/>
<td align="right">417</td>
<td align="right">417</td>
<td align="right">417</td>
<td align="right">1,668</td>
</tr>
<tr>
<td align="left">Independent set</td>
<td align="right">198</td>
<td align="left"/>
<td align="right">16</td>
<td align="right">82</td>
<td align="right">99</td>
<td align="right">395</td>
</tr>
<tr>
<td rowspan="2" align="left">GraphLncLoc</td>
<td align="left">Benchmark</td>
<td align="right">328</td>
<td align="left"/>
<td align="right">28</td>
<td align="right">325</td>
<td align="right">88</td>
<td align="right">769</td>
</tr>
<tr>
<td align="left">Independent</td>
<td align="right">20</td>
<td align="left"/>
<td align="right">7</td>
<td align="right">20</td>
<td align="right">10</td>
<td align="right">57</td>
</tr>
</tbody>
</table>
</table-wrap>
<sec id="s4-1">
<title>4.1 RNALocate based methods</title>
<p>RNAlocate is a comprehensive resource that provides information on the subcellular localization of different types of RNA molecules (<xref ref-type="bibr" rid="B84">Zhang et al., 2017</xref>). The current version of RNALocate contains a vast collection of over 37,700 manually curated entries, each supported by experimental evidence of RNA-associated subcellular localization. The database encompasses more than 21,800 coding and non-coding RNAs across 65 species. It covers a wide range of 42 subcellular locations, focusing on <italic>Homo sapiens</italic> and <italic>Mus musculus</italic>. RNALocate is a valuable repository for researchers seeking knowledge about RNA localization and its functional implications. The wealth of data available in RNALocate has been utilized in the development of several popular datasets. Notably, it has contributed to creating datasets used in lncLocator (<xref ref-type="bibr" rid="B13">Cao et al., 2018</xref>) and iLoc-lncRNA (<xref ref-type="bibr" rid="B64">Su et al., 2018</xref>). These resources leverage the comprehensive information provided by RNALocate to enhance the study of subcellular localization patterns in long non-coding RNAs (lncRNAs) and other RNA molecules.</p>
<p>The dataset for lncLocator was extracted from RNALocate version 1 (<xref ref-type="bibr" rid="B84">Zhang et al., 2017</xref>). A total of 1,361 lncRNA entries with curated subcellular localization were retrieved from the RNAlocate database, and multiple entries for the same lncRNA were combined. Only those lncRNA were retained, with their sequence information in NCBI (<xref ref-type="bibr" rid="B59">Sayers et al., 2022</xref>) and Ensembl (<xref ref-type="bibr" rid="B19">Cunningham et al., 2022</xref>). Seven subcellular locations were used for classification, and there were 19 combinations of these locations in the dataset. Redundancy was removed using CD-HIT, which was used to remove sequences with more than 80% similarity. Multi-locational lncRNAs were removed, and lncRNAs associated with only one location were allowed. Two locations (Endoplasmic reticulum and synapse) were removed as they had very few samples. Finally, a dataset of 612 lncRNA was created, covering five subcellular locations.</p>
<p>The dataset used in iLoc-lncRNA (<xref ref-type="bibr" rid="B64">Su et al., 2018</xref>) was created from RNALocate version 1 (<xref ref-type="bibr" rid="B84">Zhang et al., 2017</xref>). 923 lncRNA sequences with annotated subcellular localizations were obtained, and CD-HIT reduced redundancy at 80% similarity. After removing similar sequences, 655 non-redundant lncRNA sequences were obtained. The dataset comprises 156 lncRNAs from the nucleus, 426 lncRNAs from the cytoplasm, 43 lncRNAs from the ribosome, and S4 contains 30 lncRNAs from the exosome. This dataset was also used in lncLocation, Locate-R, and lncLocPred.</p>
<p>The training dataset used in KD-KLNMF (<xref ref-type="bibr" rid="B83">Zhang and Qiao, 2020</xref>) is obtained from <xref ref-type="bibr" rid="B81">Yang et al. (2020)</xref>, where they have used 923 sequences for the training dataset. CD-HIT was used at a similarity index threshold of 80% to remove redundant sequences from the dataset. The final training dataset contains 644 lncRNA sequences - 154 sequences from the nucleus, 417 sequences from the cytoplasm, 43 from the ribosome, and 30 from the exosome. In order to balance the dataset, SMOTE (Synthetic Minority Oversampling Technique) was applied to the dataset multiple times post-feature extraction, such that the number of samples in the minority classes equaled that of the majority class. In DeepLncLoc, LncRNAs located in only one location were selected for model construction, the dataset was created from RNALocate v1 (<xref ref-type="bibr" rid="B82">Zeng et al., 2022</xref>). GM-lncLoc (<xref ref-type="bibr" rid="B12">Cai et al., 2023</xref>) obtained datasets from iLoc-lncRNA and lncLocator, which were originally extracted from RNALocate. Both datasets were subjected to oversampling using SMOTE, and all the classes were equally represented. Dataset1 had 292 lncRNA samples, while dataset2 had 417 samples. Also, an independent dataset was created using the test dataset from DeepLncLoc. GraphLncLoc (<xref ref-type="bibr" rid="B43">Li et al., 2023</xref>) uses the benchmark dataset of DeepLncLoc for training their graph convolution network-based model.</p>
</sec>
<sec id="s4-2">
<title>4.2 RNA-seq derived datasets</title>
<p>Apart from RNALocate, some methods have used RNA-seq data to generate localization data by quantifying the gene expression in subcellular locations.</p>
<p>DeepLncRNA (<xref ref-type="bibr" rid="B68">ENCODE Project Consortium, 2012</xref>) used 93 RNA-seq samples from 14 human immortalized cell lines from the ENCODE database (<xref ref-type="bibr" rid="B68">ENCODE Project Consortium, 2012</xref>), of which 45 were from the cytosol, and 48 were from the nucleus. Differential transcript expression was used to quantify the differences in lncRNA transcript abundances between nuclear and cytosolic cellular fractions for each cell type. Log2 fold change was used to determine enrichment in the nucleus or cytosol. A sequence was assigned to the cytosol if the log2 fold change &#x3c;0, and it will be assigned to the nucleus if the log2 fold change &#x3e;2.8. Applying this log2 fold change threshold resulted in a dataset containing 4,380 cytosolic lncRNAs and 4,298 nuclear lncRNAs.</p>
<p>LncLocator 2.0 (<xref ref-type="bibr" rid="B46">Lin et al., 2021</xref>) sourced data from two databases&#x2014;nucleotide sequences from the GENCODE (<xref ref-type="bibr" rid="B27">Frankish et al., 2019</xref>) project and localization information from lncATLAS (<xref ref-type="bibr" rid="B50">Mas-Ponte et al., 2017</xref>), combined by using common gene IDs. lncATLAS uses relative concentration index (RCI) for quantifying subcellular localization. RCI is defined as the log ratio between concentrations measured by Fragments Per Kilobase Million (FPKM) in two samples (Cytoplasm/Nucleus). Different numbers of lncRNA samples are available based on the type of cell line as they have filtered out the lncRNA with Cytoplasm/Nucleus RCI in the range [&#x2212;1, 1]. The dataset used in lncLocator 2.0 was also used to develop the model in TACOS (<xref ref-type="bibr" rid="B36">Jeon et al., 2022</xref>), which is also a cell-line-specific predictor. However, TACOS utilizes only ten cell lines to develop their classifier.</p>
</sec>
</sec>
<sec id="s5">
<title>5 Methods and their performance</title>
<p>Over the past few years, there have been several advancements in predicting the subcellular localization of lncRNA sequences. Typically, these advancements involve utilizing machine learning techniques to create prediction models, with Support Vector Machine (SVM) being the most frequently employed algorithm. However, recent progress has shifted towards deep learning-based methods, which eliminate the need for manual feature selection and improve performance on benchmark datasets. For a comprehensive overview of the current tools available for subcellular localization prediction, please see <xref ref-type="table" rid="T4">Table 4</xref>. Additionally, <xref ref-type="table" rid="T5">Table 5</xref> provides information regarding the efficacy of these tools in terms of predictive accuracy and other evaluation metrics.</p>
<table-wrap id="T4" position="float">
<label>TABLE 4</label>
<caption>
<p>Summary of the existing subcellular localization prediction tools.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Method</th>
<th align="left">Year</th>
<th align="left">Feature</th>
<th align="left">Algorithm</th>
<th align="left">Number of subcellular compartments</th>
<th align="left">Citation</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">lncLocator<xref ref-type="table-fn" rid="Tfn1">
<sup>a</sup>
</xref>
</td>
<td align="left">2018</td>
<td align="left">k-mer</td>
<td align="left">Random forest, SVM, Autoencoder</td>
<td align="left">5 (Nucleus, Ribosome, Cytoplasm, Exosome, Cytosol)</td>
<td align="left">
<xref ref-type="bibr" rid="B13">Cao et al. (2018)</xref>
</td>
</tr>
<tr>
<td align="left">iLoc-lncRNA</td>
<td align="left">2018</td>
<td align="left">PseKNC</td>
<td align="left">SVM</td>
<td align="left">4 (Nucleus, Ribosome, Cytoplasm, Exosome)</td>
<td align="left">
<xref ref-type="bibr" rid="B64">Su et al. (2018)</xref>
</td>
</tr>
<tr>
<td align="left">DeepLncRNA</td>
<td align="left">2018</td>
<td align="left">k-mer, Genome loci, RNA binding motifs</td>
<td align="left">Neural Networks</td>
<td align="left">2 (Nucleus/Cytosol)</td>
<td align="left">
<xref ref-type="bibr" rid="B31">Gudenas and Wang (2018)</xref>
</td>
</tr>
<tr>
<td align="left">LncLocation</td>
<td align="left">2020</td>
<td align="left">k-mer, physico-chemical properties</td>
<td align="left">SVM</td>
<td align="left">4 (Nucleus, Ribosome, Cytoplasm, Exosome)</td>
<td align="left">
<xref ref-type="bibr" rid="B26">Feng et al. (2020)</xref>
</td>
</tr>
<tr>
<td align="left">Locate-R<sup>&#x23;2</sup>
</td>
<td align="left">2020</td>
<td align="left">k-mer, n-gapped k-mer</td>
<td align="left">Locally deep SVM</td>
<td align="left">4 (Nucleus, Ribosome, Cytoplasm, Exosome)</td>
<td align="left">
<xref ref-type="bibr" rid="B2">Ahmad et al. (2020)</xref>
</td>
</tr>
<tr>
<td align="left">lncLocPred</td>
<td align="left">2020</td>
<td align="left">k-mer, PseDNC</td>
<td align="left">Logistic regression</td>
<td align="left">4 (Nucleus, Ribosome, Cytoplasm, Exosome)</td>
<td align="left">
<xref ref-type="bibr" rid="B24">Fan et al. (2020)</xref>
</td>
</tr>
<tr>
<td align="left">KD-KLNMF</td>
<td align="left">2020</td>
<td align="left">k-mer, Di-nucleotide-based spatial autocorrelation</td>
<td align="left">SVM</td>
<td align="left">4 (Nucleus, Ribosome, Cytoplasm, Exosome)</td>
<td align="left">
<xref ref-type="bibr" rid="B83">Zhang and Qiao (2020)</xref>
</td>
</tr>
<tr>
<td align="left">lncLocator 2.0</td>
<td align="left">2021</td>
<td align="left">Word embedded sequences</td>
<td align="left">GloVe &#x2b; CNN &#x2b; BiLSTM &#x2b; MLP</td>
<td align="left">2 (Nucleus/Cytoplasm)</td>
<td align="left">
<xref ref-type="bibr" rid="B46">Lin et al. (2021)</xref>
</td>
</tr>
<tr>
<td align="left">DeepLncLoc</td>
<td align="left">2022</td>
<td align="left">k-mer, Subsequence embedding</td>
<td align="left">TextCNN</td>
<td align="left">5 (Nucleus, Ribosome, Cytoplasm, Exosome, Cytosol)</td>
<td align="left">
<xref ref-type="bibr" rid="B82">Zeng et al. (2022)</xref>
</td>
</tr>
<tr>
<td align="left">TACOS</td>
<td align="left">2022</td>
<td align="left">Composition-based, Dinucleotide physicochemical properties</td>
<td align="left">AdaBoost</td>
<td align="left">2 (Nucleus/Cytoplasm)</td>
<td align="left">
<xref ref-type="bibr" rid="B36">Jeon et al. (2022)</xref>
</td>
</tr>
<tr>
<td align="left">GM-lncLoc<xref ref-type="table-fn" rid="Tfn2">
<sup>b</sup>
</xref>
</td>
<td align="left">2023</td>
<td align="left">k-mer</td>
<td align="left">GCN based on MAML</td>
<td align="left">4/5 (Nucleus, Ribosome, Cytoplasm, Exosome)/Cytosol</td>
<td align="left">
<xref ref-type="bibr" rid="B12">Cai et al. (2023)</xref>
</td>
</tr>
<tr>
<td align="left">GraphLncLoc</td>
<td align="left">2023</td>
<td align="left">de Brujin Graphs</td>
<td align="left">Graph Convolution Networks</td>
<td align="left">4 (Nucleus, Ribosome, Cytoplasm, Exosome)</td>
<td align="left">
<xref ref-type="bibr" rid="B43">Li et al. (2023a)</xref>
</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn id="Tfn1">
<label>
<sup>a</sup>
</label>
<p>SOS oversampling.</p>
</fn>
<fn id="Tfn2">
<label>
<sup>b</sup>
</label>
<p>SMOTE oversampling.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<table-wrap id="T5" position="float">
<label>TABLE 5</label>
<caption>
<p>Performance of existing subcellular localization prediction tools.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Metrics</th>
<th align="left"/>
<th align="left">Sensitivity/Recall (%)</th>
<th align="right">Specificity (%)</th>
<th align="right">Precision (%)</th>
<th align="right">Accuracy (%)</th>
<th align="right">MCC</th>
<th align="right">F1-score</th>
<th align="right">AUC</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">lncLocator</td>
<td align="left">Overall</td>
<td align="right">36.3</td>
<td align="left"/>
<td align="left"/>
<td align="right">59.1</td>
<td align="left"/>
<td align="right">0.367</td>
<td align="left"/>
</tr>
<tr>
<td rowspan="5" align="left">iLoc-lncRNA</td>
<td align="left">Nucleus</td>
<td align="right">77.56</td>
<td align="right">97.59</td>
<td align="left"/>
<td align="left"/>
<td align="right">0.796</td>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left">Cytoplasm</td>
<td align="right">99.06</td>
<td align="right">67.68</td>
<td align="left"/>
<td align="left"/>
<td align="right">0.742</td>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left">Ribosome</td>
<td align="right">46.51</td>
<td align="right">99.83</td>
<td align="left"/>
<td align="left"/>
<td align="right">0.652</td>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left">Exosome</td>
<td align="right">16.67</td>
<td align="right">1</td>
<td align="left"/>
<td align="left"/>
<td align="right">0.4</td>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left">Overall</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="right">86.72</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left">DeepLncRNA</td>
<td align="left"/>
<td align="right">83</td>
<td align="right">62.4</td>
<td align="left"/>
<td align="right">72.4</td>
<td align="right">0.451</td>
<td align="right">0.744</td>
<td align="right">0.787</td>
</tr>
<tr>
<td rowspan="5" align="left">LncLocation</td>
<td align="left">Nucleus</td>
<td align="right">74.19</td>
<td align="left"/>
<td align="right">95.83</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left">Cytoplasm</td>
<td align="right">100</td>
<td align="left"/>
<td align="right">85</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left">Ribosome</td>
<td align="right">55.56</td>
<td align="left"/>
<td align="right">100</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left">Exosome</td>
<td align="right">33.33</td>
<td align="left"/>
<td align="right">100</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left">Overall</td>
<td align="right">87.78</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td rowspan="5" align="left">Locate-R</td>
<td align="left">Nucleus</td>
<td align="right">65.92</td>
<td align="right">95.15</td>
<td align="left"/>
<td align="left"/>
<td align="right">0.658</td>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left">Cytoplasm</td>
<td align="right">84.74</td>
<td align="right">89.1</td>
<td align="left"/>
<td align="left"/>
<td align="right">0.725</td>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left">Ribosome</td>
<td align="right">100</td>
<td align="right">98.37</td>
<td align="left"/>
<td align="left"/>
<td align="right">0.97</td>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left">Exosome</td>
<td align="right">100</td>
<td align="right">99.17</td>
<td align="left"/>
<td align="left"/>
<td align="right">0.978</td>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left">Overall</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="right">90.69</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td rowspan="5" align="left">lncLocPred</td>
<td align="left">Nucleus</td>
<td align="right">96.79</td>
<td align="right">96.79</td>
<td align="left"/>
<td align="left"/>
<td align="right">0.915</td>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left">Cytoplasm</td>
<td align="right">99.06</td>
<td align="right">85.59</td>
<td align="left"/>
<td align="left"/>
<td align="right">0.876</td>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left">Ribosome</td>
<td align="right">60.47</td>
<td align="right">99.84</td>
<td align="left"/>
<td align="left"/>
<td align="right">0.751</td>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left">Exosome</td>
<td align="right">20</td>
<td align="right">100</td>
<td align="left"/>
<td align="left"/>
<td align="right">0.439</td>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left">Overall</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="right">92.37</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td rowspan="5" align="left">KD-KLNMF</td>
<td align="left">Nucleus</td>
<td align="right">90.65</td>
<td align="right">99.52</td>
<td align="left"/>
<td align="left"/>
<td align="right">0.928</td>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left">Cytoplasm</td>
<td align="right">98.56</td>
<td align="right">96.8</td>
<td align="left"/>
<td align="left"/>
<td align="right">0.93</td>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left">Ribosome</td>
<td align="right">99.76</td>
<td align="right">100</td>
<td align="left"/>
<td align="left"/>
<td align="right">0.998</td>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left">Exosome</td>
<td align="right">100</td>
<td align="right">100</td>
<td align="left"/>
<td align="left"/>
<td align="right">1</td>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left">Overall</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="right">97.24</td>
<td align="left"/>
<td align="left"/>
<td align="right">0.9981</td>
</tr>
<tr>
<td align="left">lncLocator 2.0</td>
<td align="left">15 cell lines (min-max)</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left">0.6088&#x2013;0.8499</td>
</tr>
<tr>
<td rowspan="6" align="left">DeepLncLoc</td>
<td align="left">Nucleus</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="right">0.67</td>
</tr>
<tr>
<td align="left">Cytoplasm</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="right">0.76</td>
</tr>
<tr>
<td align="left">Ribosome</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="right">0.657</td>
</tr>
<tr>
<td align="left">Exosome</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="right">0.804</td>
</tr>
<tr>
<td align="left">Cytosol</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="right">0.806</td>
</tr>
<tr>
<td align="left">Overall</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="right">54.8</td>
<td align="left"/>
<td align="right">0.421</td>
<td align="right">0.82</td>
</tr>
<tr>
<td align="left">TACOS</td>
<td align="left">Overall (10 cell-lines)</td>
<td align="right">77.72</td>
<td align="right">72.81</td>
<td align="left"/>
<td align="right">75.26</td>
<td align="right">0.5064</td>
<td align="left"/>
<td align="right">0.8339</td>
</tr>
<tr>
<td rowspan="6" align="left">GM-lncLoc</td>
<td align="left">Overall (Dataset1)</td>
<td align="right">93.3</td>
<td align="left"/>
<td align="left"/>
<td align="right">93.4</td>
<td align="left"/>
<td align="right">0.933</td>
<td align="left"/>
</tr>
<tr>
<td align="left">Nucleus (Dataset2)</td>
<td align="right">88.85</td>
<td align="right">98.21</td>
<td align="left"/>
<td align="left"/>
<td align="right">0.889</td>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left">Cytoplasm (Dataset2)</td>
<td align="right">93.21</td>
<td align="right">96.06</td>
<td align="left"/>
<td align="left"/>
<td align="right">0.879</td>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left">Ribosome (Dataset2)</td>
<td align="right">96.8</td>
<td align="right">98.99</td>
<td align="left"/>
<td align="left"/>
<td align="right">0.959</td>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left">Exosome (Dataset2)</td>
<td align="right">99.07</td>
<td align="right">99.38</td>
<td align="left"/>
<td align="left"/>
<td align="right">0.982</td>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left">Overall (Dataset2)</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="right">94.2</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left">GraphLncLoc</td>
<td align="left">Overall</td>
<td align="left">47.5</td>
<td align="left"/>
<td align="left">69.1</td>
<td align="right">61.2</td>
<td align="left"/>
<td align="left">0.506</td>
<td align="left"/>
</tr>
</tbody>
</table>
</table-wrap>
<p>LncLocator (<xref ref-type="bibr" rid="B13">Cao et al., 2018</xref>) used an unsupervised stacked autoencoder (AE) engine that deployed on k-mer features to learn efficient data representations. Both the raw and autoencoded features were used for training the models. lncLocator achieves accuracy, F1-score, and recall of 0.591, 0.367, and 0.363, respectively, on the oversampled dataset, whereas the accuracy, F1-score, and recall of the method on the original dataset were 0.598, 0.343 and 0.356, respectively. iLoc-lncRNA (<xref ref-type="bibr" rid="B64">Su et al., 2018</xref>) is an SVM-ensemble method that utilizes a combination of Pseudo K-tuple Nucleotide Composition and 8-mer composition. Furthermore, feature selection was performed using Iterative Feature Selection (IFS). lncLocation (<xref ref-type="bibr" rid="B26">Feng et al., 2020</xref>) utilizes a combination of multiple features for training its model. These features encompass different aspects such as sequence composition, basic lncRNA characteristics, physical-chemical properties, and multi-scale secondary structural features. Additionally included are multi-scale secondary structural characteristics and physicochemical properties. By considering multiple feature combinations and utilizing SVM, lncLocation achieves its predictive capabilities for the given task.</p>
<p>Locate-R (<xref ref-type="bibr" rid="B2">Ahmad et al., 2020</xref>) was developed using k-mer and n-gapped k-mer composition as features. The value of k was varied from 1-6 while generating k-mers and, in the process, generating 5,460 features. N-gapped k-mer composition was also used, where the number of gaps n, was varied from 1-10, and the value of k was varied from 1 to 3. 39,312 new features were generated using n-gapped k-mer composition. A non-linear version of SVM, called locally deep support vector machine (LD-SVM), was used for developing the model. The model achieved an overall accuracy of 90.69%. lncLocPred (<xref ref-type="bibr" rid="B24">Fan et al., 2020</xref>) is based on a logistic regression model and three different types of features. The selected k-mer features were merged with two other types of features&#x2014;Pseudo-Dinucleotide Composition (PseDNC) and Local Structure-Sequence Triplet Element (Triplet). While Triplet makes use of the structural information of RNA sequences, PseDNC uses the sequential information and physicochemical characteristics of the nucleotide sequence. F-score-based feature selection was applied to this set of features, and an optimal set of features was obtained. lncLocPred manages to achieve an overall accuracy of 92.37%, which is an improvement of 2% over other state-of-the-art tools.</p>
<p>KD-KLNMF (<xref ref-type="bibr" rid="B83">Zhang and Qiao, 2020</xref>) employed k-mer composition and dinucleotide-based spatial autocorrelation for generating features. Kullback-Leibler divergence-based nonnegative matrix factorization (KLNMF) was employed as a feature selection method to enhance the features&#x2019; effectiveness. The Support Vector Machine (SVM) with a Radial Basis Function (RBF) kernel demonstrated the best performance among various classifiers. The model achieved an impressive overall accuracy of 97.24%, as determined by the jackknife test. DeepLncLoc (<xref ref-type="bibr" rid="B82">Zeng et al., 2022</xref>) utilizes deep learning algorithms and natural language processing techniques to develop a classifier for subcellular localization. The generation of features in DeepLncLoc involves subsequence embedding. Following subsequence embedding, an average pooling layer is used to capture the patterns of each subsequence, resulting in a matrix representation of the lncRNA sequence. Lastly, a textCNN is employed to learn high-level features and perform the prediction task. GM-lncLoc (<xref ref-type="bibr" rid="B12">Cai et al., 2023</xref>) used a Graph Convolution Network along with Model-agnostic meta-learning to develop the classification model.</p>
<p>Methods developed using RNA-seq data are primarily binary classifiers. They are designed to compare the expression of lncRNA between two locations. DeepLncRNA (<xref ref-type="bibr" rid="B31">Gudenas and Wang, 2018</xref>) uses a neural network to classify lncRNA samples into cytoplasm/nucleus based on their location labels. Three different types of features were combined to generate a feature set for the dataset. Genome loci and the presence of RNA-binding protein motifs were also used as features. lncLocator 2.0 (<xref ref-type="bibr" rid="B46">Lin et al., 2021</xref>) is a regression-based tool that predicts the Cytosol/Nucleus Relative Concentration Index (CNCRI). lncLocator 2.0 uses GloVe for sequence embedding and generating word vectors for downstream training. CNN is used for learning features from the word vectors. CNN and Bi-LSTM structure take the word vectors as the input and obtain a fixed-length feature vector. This fixed-length vector is provided to an MLP classifier, which uses the continuous CNRCI values and acts as a regressor model.</p>
</sec>
<sec id="s6">
<title>6 Challenges and future perspectives</title>
<p>The remarkable progress in experimental techniques has significantly contributed to the generation of large-scale data on lncRNAs. Fluorescence <italic>in situ</italic> hybridization (FISH), initially developed for visualizing single nucleotide targets, has evolved over time to enable the visualization of thousands of nucleotide targets at single-cell resolution. However, despite the advancements, the data produced by these methods are often not readily available in the form of public databases. One primary disadvantage of FISH-based methods is that they do not allow <italic>de novo</italic> identification of transcripts due to the requirement of probes. Also, when multiplexing is performed, overcrowding of signals can cause issues in the detection of transcripts. It has been observed that the detection efficiency drops with increasing RNA targets. Amplification of signals by techniques like hybridization chain reaction can create artifacts and increase the number of false positives. Identification and decoding barcodes, in the case of multiplexed RNA-FISH techniques, require complex software and heavy computational power.</p>
<p>Profiling methods have also made considerable strides, transitioning from microarrays to bulk RNA-seq and eventually to single-cell sequencing. The improved annotation of lncRNAs by resources like GENCODE has facilitated the quantification of lncRNA expression. However, single-cell expression data poses its own set of challenges, primarily related to low read counts of lncRNA transcripts. Unlike protein-coding genes, lncRNAs often lack well-defined functional domains, making their functional characterization more challenging using sequencing data alone.</p>
<p>Despite these challenges, the continuous advancement of experimental techniques and annotation resources has significantly enhanced our understanding of lncRNAs. Future efforts should focus on addressing the limitations associated with data availability, cost, and functional characterization. By promoting data-sharing practices, ensuring comprehensive annotations, and integrating complementary experimental approaches, we can overcome these obstacles and gain deeper insights into the functional roles and mechanisms of lncRNAs.</p>
<p>The field of lncRNA research has witnessed the development of numerous databases aimed at facilitating sequence and functional annotation. These comprehensive databases encompass various aspects related to lncRNAs, including sequence annotation, expression data, functional annotation, disease associations, and subcellular localization. Such resources have become indispensable in managing the vast volumes of data generated by high-throughput methods. However, certain limitations hinder the full utility of these databases. One prevalent issue is the outdated nature of some databases. Several well-known databases, such as LNCpedia and LncRNADisease2, have not been updated since 2018, rendering them inadequate for covering the newly generated lncRNA sequences. This lack of timely updates limits their relevance and usefulness within the rapidly evolving field. Another significant problem lies in the lack of uniformity in the naming nomenclature of lncRNA sequences across different annotation databases. Each database tends to assign its own set of names to the lncRNA sequences, resulting in confusion and defeating the purpose of accurate annotation. This inconsistency hampers effective data integration and comparability across databases. Furthermore, when it comes to subcellular localization, lncATLAS, a database specifically focused on this aspect, falls short. Last updated in 2017, lncATLAS only covers two subcellular locations, namely, the nucleus and cytoplasm. This limited coverage restricts the usability of the data, as other existing databases include annotations for major organelles beyond the nucleus and cytoplasm. Outdated databases fail to keep pace with the rapid expansion of lncRNA knowledge, naming inconsistencies hinder integration, and the limited coverage of subcellular localization databases restricts their applicability. Overcoming these limitations is essential for enhancing the effectiveness and utility of lncRNA annotation databases in advancing our understanding of these important regulatory molecules.</p>
<p>A primary challenge in the area of subcellular localization is the scarcity of sufficient training and validation data for developing prediction methods. The training datasets used to develop these prediction tools are often limited in size and diversity, which can impact the accuracy and robustness of the predictions. With the exception of RNALocate, there is a lack of well-annotated databases that provide comprehensive subcellular localization information. Many existing prediction tools rely on data from RNALocate version 1, even though an updated version 2 was released in 2021. Additionally, cell-line-specific subcellular localization information available in ENCODE is underutilized despite its potential relevance. RNA-seq data, which is commonly used for localization prediction, can be noisy and prone to inaccuracies due to variations in expression values caused by differing cell states and analysis workflows. Moreover, it has been observed that the localization of lncRNAs can vary between fixed cells and live cells, adding another layer of complexity to the prediction process. Currently, the MERFISH technique provides a promising solution by enabling the identification of RNAs associated with subcellular compartments with high sensitivity and low false discovery rates at a genome-wide scale. The availability of MERFISH datasets would greatly enhance researchers&#x2019; ability to quantify subcellular localization more accurately. Addressing these limitations will require concerted efforts to expand and diversify training datasets. Recent advances in spatial transcriptomics, enables the profiling of transcripts at subcellular resolution, providing insights into the spatial localization of RNAs within cells. This technique has become increasingly important in understanding the complex regulation of gene expression within cells, particularly in the context of disease formation and cellular processes. The availability of image data generated from spatial transcriptomics techniques offers a rich resource for investigating the spatial expression patterns of genes in different cell types and in response to environmental stimuli. These datasets can be used to identify the spatial distribution of RNAs within cells, which is crucial for understanding cellular processes such as RNA localization and its role in disease.</p>
<p>Despite the advancements in lncRNA subcellular localization prediction, the current methods still face limitations in terms of their accuracy, and further research is necessary to improve their performance. While these tools may demonstrate high accuracy when evaluated on their own training datasets, their performance on independent datasets remains notably poor. For instance, lncLocPred, Locate-R, and iLoc-lncRNA exhibited high accuracy rates of 92.37%, 90.69%, and 86.72%, respectively, on their training datasets. However, when these methods were tested on an independent dataset, their accuracies dropped significantly to 44.44%, 38.64%, and 35.86%, respectively. This decline in performance suggests the presence of bias in the machine-learning algorithms used by these methods. A similar trend was observed when GM-LncLoc compared its own method with iLoc-lncRNA, Locate-R, and lncLocPred based on an independent dataset. While these models achieved high accuracies of 94.20%, 86.72%, 90.69%, and 92.39% on their training datasets, their accuracy drastically decreased to 46.21%, 35.86%, 38.64%, and 44.44%, respectively, on the independent dataset. These findings underscore the need for further investigation into the underlying biases and limitations of current machine-learning algorithms employed in lncRNA subcellular localization prediction.</p>
</sec>
<sec sec-type="conclusion" id="s7">
<title>7 Conclusion</title>
<p>Despite all the challenges, functional annotation has made significant progress over the last few years. The generation of data using high throughput techniques should be prioritized, and the data should be made publicly accessible using well-annotated databases. The availability of large volumes of data will lead to the development of better subcellular localization prediction tools. Improved algorithms, training datasets, and rigorous validation of independent datasets are essential for the development of more accurate and robust lncRNA subcellular localization prediction methods.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="s8">
<title>Data availability statement</title>
<p>Publicly available datasets were analyzed in this study. This data can be found here: <ext-link ext-link-type="uri" xlink:href="https://webs.iiitd.edu.in/raghava/lncinfo/index.php">https://webs.iiitd.edu.in/raghava/lncinfo/index.php</ext-link>.</p>
</sec>
<sec id="s9">
<title>Author contributions</title>
<p>SC: Conceptualization, Data curation, Formal Analysis, Investigation, Methodology, Validation, Visualization, Writing&#x2013;original draft, Writing&#x2013;review and editing. AR: Data curation, Investigation, Methodology, Writing&#x2013;original draft, Writing&#x2013;review and editing. GR: Conceptualization, Formal Analysis, Funding acquisition, Investigation, Project administration, Resources, Supervision, Writing&#x2013;original draft, Writing&#x2013;review and editing.</p>
</sec>
<sec sec-type="funding-information" id="s10">
<title>Funding</title>
<p>The authors declare that financial support was received for the research, authorship, and/or publication of this article. This work was supported by the BIC grant from Department of Biotechnology, India (BT/PR40158/BTIS/137/24/2021).</p>
</sec>
<ack>
<p>Authors also are thankful to the Department of Science and Technology (DST-INSPIRE) and University Grants Commission (UGC) for fellowships and the financial support. Authors are also thankful to Department of Computational Biology, IIITD New Delhi for infrastructure and facilities. We thank the Department of Biotechnology (DBT) for providing an infrastructure grant to the institute (Grant BT/PR40158/BTIS/137/24/2021).</p>
</ack>
<sec sec-type="COI-statement" id="s11">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
<p>The authors declared that they were an editorial board member of Frontiers, at the time of submission. This had no impact on the peer review process and the final decision.</p>
</sec>
<sec sec-type="disclaimer" id="s12">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Abudayyeh</surname>
<given-names>O. O.</given-names>
</name>
<name>
<surname>Gootenberg</surname>
<given-names>J. S.</given-names>
</name>
<name>
<surname>Essletzbichler</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Han</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Joung</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Belanto</surname>
<given-names>J. J.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>RNA targeting with CRISPR-Cas13</article-title>. <source>Nature</source> <volume>550</volume>, <fpage>280</fpage>&#x2013;<lpage>284</lpage>. <pub-id pub-id-type="doi">10.1038/nature24049</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ahmad</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Lin</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Shatabda</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Locate-R: subcellular localization of long non-coding RNAs using nucleotide compositions</article-title>. <source>Genomics</source> <volume>112</volume>, <fpage>2583</fpage>&#x2013;<lpage>2589</lpage>. <pub-id pub-id-type="doi">10.1016/j.ygeno.2020.02.011</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Andjus</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Szachnowski</surname>
<given-names>U.</given-names>
</name>
<name>
<surname>Vogt</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Gioftsidi</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Hatin</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Cornu</surname>
<given-names>D.</given-names>
</name>
<etal/>
</person-group> (<year>2024</year>). <article-title>Pervasive translation of Xrn1-sensitive unstable long non-coding RNAs in yeast</article-title>. <source>RNA</source> <volume>30</volume>, <fpage>662</fpage>&#x2013;<lpage>679</lpage>. <pub-id pub-id-type="doi">10.1261/rna.079903.123</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Asim</surname>
<given-names>M. N.</given-names>
</name>
<name>
<surname>Ibrahim</surname>
<given-names>M. A.</given-names>
</name>
<name>
<surname>Imran Malik</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Dengel</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Ahmed</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Advances in computational methodologies for classification and sub-cellular locality prediction of non-coding RNAs</article-title>. <source>Int. J. Mol. Sci.</source> <volume>22</volume>, <fpage>8719</fpage>. <pub-id pub-id-type="doi">10.3390/ijms22168719</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bao</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Cui</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Dong</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>LncRNADisease 2.0: an updated database of long non-coding RNA-associated diseases</article-title>. <source>Nucleic Acids Res.</source> <volume>47</volume>, <fpage>D1034</fpage>&#x2013;<lpage>D1037</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gky905</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Barrett</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Wilhite</surname>
<given-names>S. E.</given-names>
</name>
<name>
<surname>Ledoux</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Evangelista</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>I. F.</given-names>
</name>
<name>
<surname>Tomashevsky</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>2012</year>). <article-title>NCBI GEO: archive for functional genomics data sets--update</article-title>. <source>Nucleic Acids Res.</source> <volume>41</volume>, <fpage>D991</fpage>&#x2013;<lpage>D995</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gks1193</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bertone</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Stolc</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Royce</surname>
<given-names>T. E.</given-names>
</name>
<name>
<surname>Rozowsky</surname>
<given-names>J. S.</given-names>
</name>
<name>
<surname>Urban</surname>
<given-names>A. E.</given-names>
</name>
<name>
<surname>Zhu</surname>
<given-names>X.</given-names>
</name>
<etal/>
</person-group> (<year>2004</year>). <article-title>Global identification of human transcribed sequences with genome tiling arrays</article-title>. <source>Science</source> <volume>306</volume>, <fpage>2242</fpage>&#x2013;<lpage>2246</lpage>. <pub-id pub-id-type="doi">10.1126/science.1103388</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Brockdorff</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Ashworth</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Kay</surname>
<given-names>G. F.</given-names>
</name>
<name>
<surname>McCabe</surname>
<given-names>V. M.</given-names>
</name>
<name>
<surname>Norris</surname>
<given-names>D. P.</given-names>
</name>
<name>
<surname>Cooper</surname>
<given-names>P. J.</given-names>
</name>
<etal/>
</person-group> (<year>1992</year>). <article-title>The product of the mouse Xist gene is a 15 kb inactive X-specific transcript containing no conserved ORF and located in the nucleus</article-title>. <source>Cell</source> <volume>71</volume>, <fpage>515</fpage>&#x2013;<lpage>526</lpage>. <pub-id pub-id-type="doi">10.1016/0092-8674(92)90519-i</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Brown</surname>
<given-names>C. J.</given-names>
</name>
<name>
<surname>Hendrich</surname>
<given-names>B. D.</given-names>
</name>
<name>
<surname>Rupert</surname>
<given-names>J. L.</given-names>
</name>
<name>
<surname>Lafreni&#xe8;re</surname>
<given-names>R. G.</given-names>
</name>
<name>
<surname>Xing</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Lawrence</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>1992</year>). <article-title>The human XIST gene: analysis of a 17 kb inactive X-specific RNA that contains conserved repeats and is highly localized within the nucleus</article-title>. <source>Cell</source> <volume>71</volume>, <fpage>527</fpage>&#x2013;<lpage>542</lpage>. <pub-id pub-id-type="doi">10.1016/0092-8674(92)90520-m</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Brown</surname>
<given-names>C. J.</given-names>
</name>
<name>
<surname>Lafreniere</surname>
<given-names>R. G.</given-names>
</name>
<name>
<surname>Powers</surname>
<given-names>V. E.</given-names>
</name>
<name>
<surname>Sebastio</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Ballabio</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Pettigrew</surname>
<given-names>A. L.</given-names>
</name>
<etal/>
</person-group> (<year>1991</year>). <article-title>Localization of the X inactivation centre on the human X chromosome in Xq13</article-title>. <source>Nature</source> <volume>349</volume>, <fpage>82</fpage>&#x2013;<lpage>84</lpage>. <pub-id pub-id-type="doi">10.1038/349082a0</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cabili</surname>
<given-names>M. N.</given-names>
</name>
<name>
<surname>Dunagin</surname>
<given-names>M. C.</given-names>
</name>
<name>
<surname>McClanahan</surname>
<given-names>P. D.</given-names>
</name>
<name>
<surname>Biaesch</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Padovan-Merhar</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Regev</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2015</year>). <article-title>Localization and abundance analysis of human lncRNAs at single-cell and single-molecule resolution</article-title>. <source>Genome Biol.</source> <volume>16</volume>, <fpage>20</fpage>. <pub-id pub-id-type="doi">10.1186/s13059-015-0586-4</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cai</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Deng</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Tang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>GM-lncLoc: LncRNAs subcellular localization prediction based on graph neural network with meta-learning</article-title>. <source>BMC Genomics</source> <volume>24</volume>, <fpage>52</fpage>. <pub-id pub-id-type="doi">10.1186/s12864-022-09034-1</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cao</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Pan</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Shen</surname>
<given-names>H.-B.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>The lncLocator: a subcellular localization predictor for long non-coding RNAs based on a stacked ensemble classifier</article-title>. <source>Bioinformatics</source> <volume>34</volume>, <fpage>2185</fpage>&#x2013;<lpage>2194</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/bty085</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Carlevaro-Fita</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Rahim</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Guig&#xf3;</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Vardy</surname>
<given-names>L. A.</given-names>
</name>
<name>
<surname>Johnson</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Cytoplasmic long noncoding RNAs are frequently bound to and degraded at ribosomes in human cells</article-title>. <source>RNA</source> <volume>22</volume>, <fpage>867</fpage>&#x2013;<lpage>882</lpage>. <pub-id pub-id-type="doi">10.1261/rna.053561.115</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Brunner</surname>
<given-names>A.-D.</given-names>
</name>
<name>
<surname>Cogan</surname>
<given-names>J. Z.</given-names>
</name>
<name>
<surname>Nu&#xf1;ez</surname>
<given-names>J. K.</given-names>
</name>
<name>
<surname>Fields</surname>
<given-names>A. P.</given-names>
</name>
<name>
<surname>Adamson</surname>
<given-names>B.</given-names>
</name>
<etal/>
</person-group> (<year>2020a</year>). <article-title>Pervasive functional translation of noncanonical human open reading frames</article-title>. <source>Science</source> <volume>367</volume>, <fpage>1140</fpage>&#x2013;<lpage>1146</lpage>. <pub-id pub-id-type="doi">10.1126/science.aay0262</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>K. H.</given-names>
</name>
<name>
<surname>Boettiger</surname>
<given-names>A. N.</given-names>
</name>
<name>
<surname>Moffitt</surname>
<given-names>J. R.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Zhuang</surname>
<given-names>X.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>RNA imaging. Spatially resolved, highly multiplexed RNA profiling in single cells</article-title>. <source>Science</source> <volume>348</volume>, <fpage>aaa6090</fpage>. <pub-id pub-id-type="doi">10.1126/science.aaa6090</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Lei</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Nie</surname>
<given-names>Z.</given-names>
</name>
</person-group> (<year>2020b</year>). <article-title>CRISPR-Cas system for RNA detection and imaging</article-title>. <source>Chem. Res. Chin. Univ.</source> <volume>36</volume>, <fpage>157</fpage>&#x2013;<lpage>163</lpage>. <pub-id pub-id-type="doi">10.1007/s40242-019-0030-5</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cui</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Dou</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Tan</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Ni</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>D.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>RNALocate v2.0: an updated resource for RNA subcellular localization with increased coverage and annotation</article-title>. <source>Nucleic Acids Res.</source> <volume>50</volume>, <fpage>D333</fpage>&#x2013;<lpage>D339</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkab825</pub-id>
</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cunningham</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Allen</surname>
<given-names>J. E.</given-names>
</name>
<name>
<surname>Allen</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Alvarez-Jarreta</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Amode</surname>
<given-names>M. R.</given-names>
</name>
<name>
<surname>Armean</surname>
<given-names>I. M.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Ensembl 2022</article-title>. <source>Nucleic Acids Res.</source> <volume>50</volume>, <fpage>D988</fpage>&#x2013;<lpage>D995</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkab1049</pub-id>
</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Djebali</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Davis</surname>
<given-names>C. A.</given-names>
</name>
<name>
<surname>Merkel</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Dobin</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Lassmann</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Mortazavi</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2012</year>). <article-title>Landscape of transcription in human cells</article-title>. <source>Nature</source> <volume>489</volume>, <fpage>101</fpage>&#x2013;<lpage>108</lpage>. <pub-id pub-id-type="doi">10.1038/nature11233</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dykes</surname>
<given-names>I. M.</given-names>
</name>
<name>
<surname>Emanueli</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Transcriptional and post-transcriptional gene regulation by long non-coding RNA</article-title>. <source>Genomics Proteomics Bioinforma.</source> <volume>15</volume>, <fpage>177</fpage>&#x2013;<lpage>186</lpage>. <pub-id pub-id-type="doi">10.1016/j.gpb.2016.12.005</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Eng</surname>
<given-names>C.-H. L.</given-names>
</name>
<name>
<surname>Lawson</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Zhu</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Dries</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Koulena</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Takei</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Transcriptome-scale super-resolved imaging in tissues by RNA seqFISH&#x2b;</article-title>. <source>Nature</source> <volume>568</volume>, <fpage>235</fpage>&#x2013;<lpage>239</lpage>. <pub-id pub-id-type="doi">10.1038/s41586-019-1049-y</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fagerberg</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Hallstr&#xf6;m</surname>
<given-names>B. M.</given-names>
</name>
<name>
<surname>Oksvold</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Kampf</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Djureinovic</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Odeberg</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2014</year>). <article-title>Analysis of the human tissue-specific expression by genome-wide integration of transcriptomics and antibody-based proteomics</article-title>. <source>Mol. Cell. Proteomics</source> <volume>13</volume>, <fpage>397</fpage>&#x2013;<lpage>406</lpage>. <pub-id pub-id-type="doi">10.1074/mcp.M113.035600</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fan</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Zhu</surname>
<given-names>Q.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>lncLocPred: predicting LncRNA subcellular localization using multiple sequence feature information</article-title>. <source>IEEE Access</source> <volume>8</volume>, <fpage>124702</fpage>&#x2013;<lpage>124711</lpage>. <pub-id pub-id-type="doi">10.1109/ACCESS.2020.3007317</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Femino</surname>
<given-names>A. M.</given-names>
</name>
<name>
<surname>Fay</surname>
<given-names>F. S.</given-names>
</name>
<name>
<surname>Fogarty</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Singer</surname>
<given-names>R. H.</given-names>
</name>
</person-group> (<year>1998</year>). <article-title>Visualization of single RNA transcripts <italic>in situ</italic>
</article-title>. <source>Science</source> <volume>280</volume>, <fpage>585</fpage>&#x2013;<lpage>590</lpage>. <pub-id pub-id-type="doi">10.1126/science.280.5363.585</pub-id>
</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Feng</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Liang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Du</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Lv</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>LncLocation: efficient subcellular location prediction of long non-coding RNA-based multi-source heterogeneous feature fusion</article-title>. <source>Int. J. Mol. Sci.</source> <volume>21</volume>, <fpage>7271</fpage>. <pub-id pub-id-type="doi">10.3390/ijms21197271</pub-id>
</citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Frankish</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Diekhans</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Ferreira</surname>
<given-names>A.-M.</given-names>
</name>
<name>
<surname>Johnson</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Jungreis</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Loveland</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>GENCODE reference annotation for the human and mouse genomes</article-title>. <source>Nucleic Acids Res.</source> <volume>47</volume>, <fpage>D766</fpage>&#x2013;<lpage>D773</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gky955</pub-id>
</citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gao</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Shang</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Guo</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>H.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Lnc2Cancer 3.0: an updated resource for experimentally supported lncRNA/circRNA cancer associations and web tools based on RNA-seq and scRNA-seq data</article-title>. <source>Nucleic Acids Res.</source> <volume>49</volume>, <fpage>D1251</fpage>&#x2013;<lpage>D1258</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkaa1006</pub-id>
</citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gardini</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Global run-On sequencing (GRO-seq)</article-title>. <source>Methods Mol. Biol.</source> <volume>1468</volume>, <fpage>111</fpage>&#x2013;<lpage>120</lpage>. <pub-id pub-id-type="doi">10.1007/978-1-4939-4035-6_9</pub-id>
</citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>German</surname>
<given-names>M. A.</given-names>
</name>
<name>
<surname>Luo</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Schroth</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Meyers</surname>
<given-names>B. C.</given-names>
</name>
<name>
<surname>Green</surname>
<given-names>P. J.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Construction of Parallel Analysis of RNA Ends (PARE) libraries for the study of cleaved miRNA targets and the RNA degradome</article-title>. <source>Nat. Protoc.</source> <volume>4</volume>, <fpage>356</fpage>&#x2013;<lpage>362</lpage>. <pub-id pub-id-type="doi">10.1038/nprot.2009.8</pub-id>
</citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gudenas</surname>
<given-names>B. L.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Prediction of LncRNA subcellular localization with deep learning from sequence features</article-title>. <source>Sci. Rep.</source> <volume>8</volume>, <fpage>16385</fpage>. <pub-id pub-id-type="doi">10.1038/s41598-018-34708-w</pub-id>
</citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gyllborg</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Langseth</surname>
<given-names>C. M.</given-names>
</name>
<name>
<surname>Qian</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Choi</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Salas</surname>
<given-names>S. M.</given-names>
</name>
<name>
<surname>Hilscher</surname>
<given-names>M. M.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Hybridization-based <italic>in situ</italic> sequencing (HybISS) for spatially resolved transcriptomics in human and mouse brain tissue</article-title>. <source>Nucleic Acids Res.</source> <volume>48</volume>, <fpage>e112</fpage>. <pub-id pub-id-type="doi">10.1093/nar/gkaa792</pub-id>
</citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hartford</surname>
<given-names>C. C. R.</given-names>
</name>
<name>
<surname>Lal</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>When long noncoding becomes protein coding</article-title>. <source>Mol. Cell. Biol.</source> <volume>40</volume>, <fpage>005288</fpage>&#x2013;<lpage>e611</lpage>. <pub-id pub-id-type="doi">10.1128/MCB.00528-19</pub-id>
</citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Heinrich</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Sidler</surname>
<given-names>C. L.</given-names>
</name>
<name>
<surname>Azzalin</surname>
<given-names>C. M.</given-names>
</name>
<name>
<surname>Weis</surname>
<given-names>K.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Stem-loop RNA labeling can affect nuclear and cytoplasmic mRNA processing</article-title>. <source>RNA</source> <volume>23</volume>, <fpage>134</fpage>&#x2013;<lpage>141</lpage>. <pub-id pub-id-type="doi">10.1261/rna.057786.116</pub-id>
</citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hon</surname>
<given-names>C.-C.</given-names>
</name>
<name>
<surname>Ramilowski</surname>
<given-names>J. A.</given-names>
</name>
<name>
<surname>Harshbarger</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Bertin</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Rackham</surname>
<given-names>O. J. L.</given-names>
</name>
<name>
<surname>Gough</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>An atlas of human long non-coding RNAs with accurate 5&#x2019; ends</article-title>. <source>Nature</source> <volume>543</volume>, <fpage>199</fpage>&#x2013;<lpage>204</lpage>. <pub-id pub-id-type="doi">10.1038/nature21374</pub-id>
</citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jeon</surname>
<given-names>Y.-J.</given-names>
</name>
<name>
<surname>Hasan</surname>
<given-names>M. M.</given-names>
</name>
<name>
<surname>Park</surname>
<given-names>H. W.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>K. W.</given-names>
</name>
<name>
<surname>Manavalan</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>TACOS: a novel approach for accurate prediction of cell-specific long noncoding RNAs subcellular localization</article-title>. <source>Briefings Bioinforma.</source> <volume>23</volume>, <fpage>bbac243</fpage>. <pub-id pub-id-type="doi">10.1093/bib/bbac243</pub-id>
</citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kaewsapsak</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Shechner</surname>
<given-names>D. M.</given-names>
</name>
<name>
<surname>Mallard</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Rinn</surname>
<given-names>J. L.</given-names>
</name>
<name>
<surname>Ting</surname>
<given-names>A. Y.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Live-cell mapping of organelle-associated RNAs via proximity biotinylation combined with protein-RNA crosslinking</article-title>. <source>Elife</source> <volume>6</volume>, <fpage>e29224</fpage>. <pub-id pub-id-type="doi">10.7554/elife.29224</pub-id>
</citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Keene</surname>
<given-names>J. D.</given-names>
</name>
<name>
<surname>Komisarow</surname>
<given-names>J. M.</given-names>
</name>
<name>
<surname>Friedersdorf</surname>
<given-names>M. B.</given-names>
</name>
</person-group> (<year>2006</year>). <article-title>RIP-Chip: the isolation and identification of mRNAs, microRNAs and protein components of ribonucleoprotein complexes from cell extracts</article-title>. <source>Nat. Protoc.</source> <volume>1</volume>, <fpage>302</fpage>&#x2013;<lpage>307</lpage>. <pub-id pub-id-type="doi">10.1038/nprot.2006.47</pub-id>
</citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kishi</surname>
<given-names>J. Y.</given-names>
</name>
<name>
<surname>Lapan</surname>
<given-names>S. W.</given-names>
</name>
<name>
<surname>Beliveau</surname>
<given-names>B. J.</given-names>
</name>
<name>
<surname>West</surname>
<given-names>E. R.</given-names>
</name>
<name>
<surname>Zhu</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Sasaki</surname>
<given-names>H. M.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>SABER amplifies FISH: enhanced multiplexed imaging of RNA and DNA in cells and tissues</article-title>. <source>Nat. Methods</source> <volume>16</volume>, <fpage>533</fpage>&#x2013;<lpage>544</lpage>. <pub-id pub-id-type="doi">10.1038/s41592-019-0404-0</pub-id>
</citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lee</surname>
<given-names>J. H.</given-names>
</name>
<name>
<surname>Daugharthy</surname>
<given-names>E. R.</given-names>
</name>
<name>
<surname>Scheiman</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Kalhor</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Ferrante</surname>
<given-names>T. C.</given-names>
</name>
<name>
<surname>Terry</surname>
<given-names>R.</given-names>
</name>
<etal/>
</person-group> (<year>2015</year>). <article-title>Fluorescent <italic>in situ</italic> sequencing (FISSEQ) of RNA for gene expression profiling in intact cells and tissues</article-title>. <source>Nat. Protoc.</source> <volume>10</volume>, <fpage>442</fpage>&#x2013;<lpage>458</lpage>. <pub-id pub-id-type="doi">10.1038/nprot.2014.191</pub-id>
</citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Levesque</surname>
<given-names>M. J.</given-names>
</name>
<name>
<surname>Ginart</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Wei</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Raj</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Visualizing SNVs to quantify allele-specific expression in single cells</article-title>. <source>Nat. Methods</source> <volume>10</volume>, <fpage>865</fpage>&#x2013;<lpage>867</lpage>. <pub-id pub-id-type="doi">10.1038/nmeth.2589</pub-id>
</citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Han</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Roebuck</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Diao</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Yuan</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2015</year>). <article-title>TANRIC: an interactive open platform to explore the function of lncRNAs in cancer</article-title>. <source>Cancer Res.</source> <volume>75</volume>, <fpage>3728</fpage>&#x2013;<lpage>3737</lpage>. <pub-id pub-id-type="doi">10.1158/0008-5472.CAN-15-0273</pub-id>
</citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Yin</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Lu</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Guo</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Zeng</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2023a</year>). <article-title>GraphLncLoc: long non-coding RNA subcellular localization prediction using graph convolutional networks based on sequence to graph transformation</article-title>. <source>Briefings Bioinforma.</source> <volume>24</volume>, <fpage>bbac565</fpage>. <pub-id pub-id-type="doi">10.1093/bib/bbac565</pub-id>
</citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Feng</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Qin</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Xiao</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Z.</given-names>
</name>
<etal/>
</person-group> (<year>2023b</year>). <article-title>LncBook 2.0: integrating human long non-coding RNAs with multi-omics annotations</article-title>. <source>Nucleic Acids Res.</source> <volume>51</volume>, <fpage>D186</fpage>&#x2013;<lpage>D191</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkac999</pub-id>
</citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Jiang</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Feng</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Du</surname>
<given-names>Q.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>LncExpDB: an expression database of human long non-coding RNAs</article-title>. <source>Nucleic Acids Res.</source> <volume>49</volume>, <fpage>D962</fpage>&#x2013;<lpage>D968</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkaa850</pub-id>
</citation>
</ref>
<ref id="B46">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lin</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Pan</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Shen</surname>
<given-names>H.-B.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>lncLocator 2.0: a cell-line-specific subcellular localization predictor for long non-coding RNAs with interpretable deep learning</article-title>. <source>Bioinformatics</source> <volume>37</volume>, <fpage>2308</fpage>&#x2013;<lpage>2316</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btab127</pub-id>
</citation>
</ref>
<ref id="B47">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lorenzi</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Chiu</surname>
<given-names>H.-S.</given-names>
</name>
<name>
<surname>Avila Cobos</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Gross</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Volders</surname>
<given-names>P.-J.</given-names>
</name>
<name>
<surname>Cannoodt</surname>
<given-names>R.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>The RNA Atlas expands the catalog of human non-coding RNAs</article-title>. <source>Nat. Biotechnol.</source> <volume>39</volume>, <fpage>1453</fpage>&#x2013;<lpage>1465</lpage>. <pub-id pub-id-type="doi">10.1038/s41587-021-00936-1</pub-id>
</citation>
</ref>
<ref id="B48">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lubeck</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Cai</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Single-cell systems biology by super-resolution imaging and combinatorial labeling</article-title>. <source>Nat. Methods</source> <volume>9</volume>, <fpage>743</fpage>&#x2013;<lpage>748</lpage>. <pub-id pub-id-type="doi">10.1038/nmeth.2069</pub-id>
</citation>
</ref>
<ref id="B49">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Luo</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Hitz</surname>
<given-names>B. C.</given-names>
</name>
<name>
<surname>Gabdank</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Hilton</surname>
<given-names>J. A.</given-names>
</name>
<name>
<surname>Kagda</surname>
<given-names>M. S.</given-names>
</name>
<name>
<surname>Lam</surname>
<given-names>B.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>New developments on the Encyclopedia of DNA Elements (ENCODE) data portal</article-title>. <source>Nucleic Acids Res.</source> <volume>48</volume>, <fpage>D882</fpage>&#x2013;<lpage>D889</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkz1062</pub-id>
</citation>
</ref>
<ref id="B50">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mas-Ponte</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Carlevaro-Fita</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Palumbo</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Hermoso Pulido</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Guigo</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Johnson</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>LncATLAS database for subcellular localization of long noncoding RNAs</article-title>. <source>RNA</source> <volume>23</volume>, <fpage>1080</fpage>&#x2013;<lpage>1087</lpage>. <pub-id pub-id-type="doi">10.1261/rna.060814.117</pub-id>
</citation>
</ref>
<ref id="B51">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mellis</surname>
<given-names>I. A.</given-names>
</name>
<name>
<surname>Gupte</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Raj</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Rouhanifard</surname>
<given-names>S. H.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Visualizing adenosine-to-inosine RNA editing in single mammalian cells</article-title>. <source>Nat. Methods</source> <volume>14</volume>, <fpage>801</fpage>&#x2013;<lpage>804</lpage>. <pub-id pub-id-type="doi">10.1038/nmeth.4332</pub-id>
</citation>
</ref>
<ref id="B52">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pelechano</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Wei</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Steinmetz</surname>
<given-names>L. M.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Extensive transcriptional heterogeneity revealed by isoform profiling</article-title>. <source>Nature</source> <volume>497</volume>, <fpage>127</fpage>&#x2013;<lpage>131</lpage>. <pub-id pub-id-type="doi">10.1038/nature12121</pub-id>
</citation>
</ref>
<ref id="B53">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pertea</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Shumate</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Pertea</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Varabyou</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Breitwieser</surname>
<given-names>F. P.</given-names>
</name>
<name>
<surname>Chang</surname>
<given-names>Y.-C.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>CHESS: a new human gene catalog curated from thousands of large-scale RNA sequencing experiments reveals extensive transcriptional noise</article-title>. <source>Genome Biol.</source> <volume>19</volume>, <fpage>208</fpage>. <pub-id pub-id-type="doi">10.1186/s13059-018-1590-2</pub-id>
</citation>
</ref>
<ref id="B54">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pisignano</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Ladomery</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Epigenetic regulation of alternative splicing: how LncRNAs tailor the message</article-title>. <source>Noncoding RNA</source> <volume>7</volume>, <fpage>21</fpage>. <pub-id pub-id-type="doi">10.3390/ncrna7010021</pub-id>
</citation>
</ref>
<ref id="B55">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Raj</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Tyagi</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Detection of individual endogenous RNA transcripts <italic>in situ</italic> using multiple singly labeled probes</article-title>. <source>Methods Enzym.</source> <volume>472</volume>, <fpage>365</fpage>&#x2013;<lpage>386</lpage>. <pub-id pub-id-type="doi">10.1016/S0076-6879(10)72004-8</pub-id>
</citation>
</ref>
<ref id="B56">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Romero-Barrios</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Legascue</surname>
<given-names>M. F.</given-names>
</name>
<name>
<surname>Benhamed</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Ariel</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Crespi</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Splicing regulation by long noncoding RNAs</article-title>. <source>Nucleic Acids Res.</source> <volume>46</volume>, <fpage>2169</fpage>&#x2013;<lpage>2184</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gky095</pub-id>
</citation>
</ref>
<ref id="B57">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rouhanifard</surname>
<given-names>S. H.</given-names>
</name>
<name>
<surname>Mellis</surname>
<given-names>I. A.</given-names>
</name>
<name>
<surname>Dunagin</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Bayatpour</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Jiang</surname>
<given-names>C. L.</given-names>
</name>
<name>
<surname>Dardani</surname>
<given-names>I.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>ClampFISH detects individual nucleic acid molecules using click chemistry-based amplification</article-title>. <source>Nat. Biotechnol.</source> <volume>37</volume>, <fpage>84</fpage>&#x2013;<lpage>89</lpage>. <pub-id pub-id-type="doi">10.1038/nbt.4286</pub-id>
</citation>
</ref>
<ref id="B58">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Savulescu</surname>
<given-names>A. F.</given-names>
</name>
<name>
<surname>Bouilhol</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Beaume</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Nikolski</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Prediction of RNA subcellular localization: learning from heterogeneous data sources</article-title>. <source>iScience</source> <volume>24</volume>, <fpage>103298</fpage>. <pub-id pub-id-type="doi">10.1016/j.isci.2021.103298</pub-id>
</citation>
</ref>
<ref id="B59">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sayers</surname>
<given-names>E. W.</given-names>
</name>
<name>
<surname>Bolton</surname>
<given-names>E. E.</given-names>
</name>
<name>
<surname>Brister</surname>
<given-names>J. R.</given-names>
</name>
<name>
<surname>Canese</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Chan</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Comeau</surname>
<given-names>D. C.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Database resources of the national center for biotechnology information</article-title>. <source>Nucleic Acids Res.</source> <volume>50</volume>, <fpage>D20</fpage>&#x2013;<lpage>D26</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkab1112</pub-id>
</citation>
</ref>
<ref id="B60">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Schena</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Shalon</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Davis</surname>
<given-names>R. W.</given-names>
</name>
<name>
<surname>Brown</surname>
<given-names>P. O.</given-names>
</name>
</person-group> (<year>1995</year>). <article-title>Quantitative monitoring of gene expression patterns with a complementary DNA microarray</article-title>. <source>Science</source> <volume>270</volume>, <fpage>467</fpage>&#x2013;<lpage>470</lpage>. <pub-id pub-id-type="doi">10.1126/science.270.5235.467</pub-id>
</citation>
</ref>
<ref id="B61">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shiraki</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Kondo</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Katayama</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Waki</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Kasukawa</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Kawaji</surname>
<given-names>H.</given-names>
</name>
<etal/>
</person-group> (<year>2003</year>). <article-title>Cap analysis gene expression for high-throughput analysis of transcriptional starting point and identification of promoter usage</article-title>. <source>Proc. Natl. Acad. Sci. U. S. A.</source> <volume>100</volume>, <fpage>15776</fpage>&#x2013;<lpage>15781</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.2136655100</pub-id>
</citation>
</ref>
<ref id="B62">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Smola</surname>
<given-names>M. J.</given-names>
</name>
<name>
<surname>Rice</surname>
<given-names>G. M.</given-names>
</name>
<name>
<surname>Busan</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Siegfried</surname>
<given-names>N. A.</given-names>
</name>
<name>
<surname>Weeks</surname>
<given-names>K. M.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Selective 2&#x2019;-hydroxyl acylation analyzed by primer extension and mutational profiling (SHAPE-MaP) for direct, versatile and accurate RNA structure analysis</article-title>. <source>Nat. Protoc.</source> <volume>10</volume>, <fpage>1643</fpage>&#x2013;<lpage>1669</lpage>. <pub-id pub-id-type="doi">10.1038/nprot.2015.103</pub-id>
</citation>
</ref>
<ref id="B63">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Statello</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Guo</surname>
<given-names>C.-J.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>L.-L.</given-names>
</name>
<name>
<surname>Huarte</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Gene regulation by long non-coding RNAs and its biological functions</article-title>. <source>Nat. Rev. Mol. Cell Biol.</source> <volume>22</volume>, <fpage>96</fpage>&#x2013;<lpage>118</lpage>. <pub-id pub-id-type="doi">10.1038/s41580-020-00315-9</pub-id>
</citation>
</ref>
<ref id="B64">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Su</surname>
<given-names>Z.-D.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Z.-Y.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>Y.-W.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>W.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>iLoc-lncRNA: predict the subcellular location of lncRNAs by incorporating octamer composition into general PseKNC</article-title>. <source>Bioinforma. Oxf. Engl.</source> <volume>34</volume>, <fpage>4196</fpage>&#x2013;<lpage>4204</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/bty508</pub-id>
</citation>
</ref>
<ref id="B65">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sweeney</surname>
<given-names>B. A.</given-names>
</name>
<name>
<surname>Petrov</surname>
<given-names>A. I.</given-names>
</name>
<name>
<surname>Ribas</surname>
<given-names>C. E.</given-names>
</name>
<name>
<surname>Finn</surname>
<given-names>R. D.</given-names>
</name>
<name>
<surname>Bateman</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Szymanski</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>RNAcentral 2021: secondary structure integration, improved sequence search and new member databases</article-title>. <source>Nucleic Acids Res.</source> <volume>49</volume>, <fpage>D212</fpage>&#x2013;<lpage>D220</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkaa921</pub-id>
</citation>
</ref>
<ref id="B66">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Symmons</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Chang</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Mellis</surname>
<given-names>I. A.</given-names>
</name>
<name>
<surname>Kalish</surname>
<given-names>J. M.</given-names>
</name>
<name>
<surname>Park</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Suszt&#xe1;k</surname>
<given-names>K.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Allele-specific RNA imaging shows that allelic imbalances can arise in tissues through transcriptional bursting</article-title>. <source>PLoS Genet.</source> <volume>15</volume>, <fpage>e1007874</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pgen.1007874</pub-id>
</citation>
</ref>
<ref id="B67">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Szcze&#x15b;niak</surname>
<given-names>M. W.</given-names>
</name>
<name>
<surname>Bryzghalov</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Ciomborowska-Basheer</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Maka&#x142;owska</surname>
<given-names>I.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>CANTATAdb 2.0: expanding the collection of plant long noncoding RNAs</article-title>. <source>Methods Mol. Biol.</source> <volume>1933</volume>, <fpage>415</fpage>&#x2013;<lpage>429</lpage>. <pub-id pub-id-type="doi">10.1007/978-1-4939-9045-0_26</pub-id>
</citation>
</ref>
<ref id="B68">
<citation citation-type="journal">
<collab>The ENCODE Project Consortium</collab> (<year>2012</year>). <article-title>An integrated encyclopedia of DNA elements in the human genome</article-title>. <source>Nature</source> <volume>489</volume>, <fpage>57</fpage>&#x2013;<lpage>74</lpage>. <pub-id pub-id-type="doi">10.1038/nature11247</pub-id>
</citation>
</ref>
<ref id="B69">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tilgner</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Knowles</surname>
<given-names>D. G.</given-names>
</name>
<name>
<surname>Johnson</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Davis</surname>
<given-names>C. A.</given-names>
</name>
<name>
<surname>Chakrabortty</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Djebali</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2012</year>). <article-title>Deep sequencing of subcellular RNA fractions shows splicing to be predominantly co-transcriptional in the human genome but inefficient for lncRNAs</article-title>. <source>Genome Res.</source> <volume>22</volume>, <fpage>1616</fpage>&#x2013;<lpage>1625</lpage>. <pub-id pub-id-type="doi">10.1101/gr.134445.111</pub-id>
</citation>
</ref>
<ref id="B70">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tsanov</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Samacoits</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Chouaib</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Traboulsi</surname>
<given-names>A.-M.</given-names>
</name>
<name>
<surname>Gostan</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Weber</surname>
<given-names>C.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>smiFISH and FISH-quant - a flexible single RNA detection approach with super-resolution capability</article-title>. <source>Nucleic Acids Res.</source> <volume>44</volume>, <fpage>e165</fpage>. <pub-id pub-id-type="doi">10.1093/nar/gkw784</pub-id>
</citation>
</ref>
<ref id="B71">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Velculescu</surname>
<given-names>V. E.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Vogelstein</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Kinzler</surname>
<given-names>K. W.</given-names>
</name>
</person-group> (<year>1995</year>). <article-title>Serial analysis of gene expression</article-title>. <source>Science</source> <volume>270</volume>, <fpage>484</fpage>&#x2013;<lpage>487</lpage>. <pub-id pub-id-type="doi">10.1126/science.270.5235.484</pub-id>
</citation>
</ref>
<ref id="B72">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Volders</surname>
<given-names>P.-J.</given-names>
</name>
<name>
<surname>Anckaert</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Verheggen</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Nuytens</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Martens</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Mestdagh</surname>
<given-names>P.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>LNCipedia 5: towards a reference set of human long non-coding RNAs</article-title>. <source>Nucleic Acids Res.</source> <volume>47</volume>, <fpage>D135</fpage>&#x2013;<lpage>D139</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gky1031</pub-id>
</citation>
</ref>
<ref id="B73">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wan</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Qu</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Ouyang</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Chang</surname>
<given-names>H. Y.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Genome-wide mapping of RNA structure using nuclease digestion and high-throughput sequencing</article-title>. <source>Nat. Protoc.</source> <volume>8</volume>, <fpage>849</fpage>&#x2013;<lpage>869</lpage>. <pub-id pub-id-type="doi">10.1038/nprot.2013.045</pub-id>
</citation>
</ref>
<ref id="B74">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Jiang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Mao</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Lin</surname>
<given-names>H.</given-names>
</name>
<etal/>
</person-group> (<year>2021a</year>). <article-title>DM3Loc: multi-label mRNA subcellular localization prediction and analysis based on multi-head self-attention mechanism</article-title>. <source>Nucleic Acids Res.</source> <volume>49</volume>, <fpage>e46</fpage>. <pub-id pub-id-type="doi">10.1093/nar/gkab016</pub-id>
</citation>
</ref>
<ref id="B75">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Cai</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Tang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2021b</year>). &#x201c;<article-title>A review on predicting subcellular localization of lncRNA</article-title>,&#x201d; in <source>2021 13th international conference on intelligent human-machine systems and cybernetics (IHMSC)</source> (<publisher-name>IEEE</publisher-name>). <pub-id pub-id-type="doi">10.1109/ihmsc52134.2021.00043</pub-id>
</citation>
</ref>
<ref id="B76">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Allen</surname>
<given-names>W. E.</given-names>
</name>
<name>
<surname>Wright</surname>
<given-names>M. A.</given-names>
</name>
<name>
<surname>Sylwestrak</surname>
<given-names>E. L.</given-names>
</name>
<name>
<surname>Samusik</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Vesuna</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Three-dimensional intact-tissue sequencing of single-cell transcriptional states</article-title>. <source>Science</source> <volume>361</volume>, <fpage>eaat5691</fpage>. <pub-id pub-id-type="doi">10.1126/science.aat5691</pub-id>
</citation>
</ref>
<ref id="B77">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Gerstein</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Snyder</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>RNA-Seq: a revolutionary tool for transcriptomics</article-title>. <source>Nat. Rev. Genet.</source> <volume>10</volume>, <fpage>57</fpage>&#x2013;<lpage>63</lpage>. <pub-id pub-id-type="doi">10.1038/nrg2484</pub-id>
</citation>
</ref>
<ref id="B78">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wei</surname>
<given-names>L.-H.</given-names>
</name>
<name>
<surname>Guo</surname>
<given-names>J. U.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Coding functions of &#x201c;noncoding&#x201d; RNAs</article-title>. <source>Science</source> <volume>367</volume>, <fpage>1074</fpage>&#x2013;<lpage>1075</lpage>. <pub-id pub-id-type="doi">10.1126/science.aba6117</pub-id>
</citation>
</ref>
<ref id="B79">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wen</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Gao</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Guo</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>lncSLdb: a resource for long non-coding RNA subcellular localization</article-title>. <source>Database (Oxford)</source> <volume>2018</volume>, <fpage>1</fpage>&#x2013;<lpage>6</lpage>. <pub-id pub-id-type="doi">10.1093/database/bay085</pub-id>
</citation>
</ref>
<ref id="B80">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xia</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Fan</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Emanuel</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Hao</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Zhuang</surname>
<given-names>X.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Spatial transcriptome profiling by MERFISH reveals subcellular RNA compartmentalization and cell cycle-dependent gene expression</article-title>. <source>Proc. Natl. Acad. Sci. U. S. A.</source> <volume>116</volume>, <fpage>19490</fpage>&#x2013;<lpage>19499</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1912459116</pub-id>
</citation>
</ref>
<ref id="B81">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname>
<given-names>X.-F.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>Y.-K.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Gao</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Du</surname>
<given-names>P.-F.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Predicting LncRNA subcellular localization using unbalanced pseudo-k nucleotide compositions</article-title>. <source>Curr. Bioinforma.</source> <volume>15</volume>, <fpage>554</fpage>&#x2013;<lpage>562</lpage>. <pub-id pub-id-type="doi">10.2174/1574893614666190902151038</pub-id>
</citation>
</ref>
<ref id="B82">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zeng</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Lu</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>F.-X.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>DeepLncLoc: a deep learning framework for long non-coding RNA subcellular localization prediction based on subsequence embedding</article-title>. <source>Briefings Bioinforma.</source> <volume>23</volume>, <fpage>bbab360</fpage>. <pub-id pub-id-type="doi">10.1093/bib/bbab360</pub-id>
</citation>
</ref>
<ref id="B83">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Qiao</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>KD-KLNMF: identification of lncRNAs subcellular localization with multiple features and nonnegative matrix factorization</article-title>. <source>Anal. Biochem.</source> <volume>610</volume>, <fpage>113995</fpage>. <pub-id pub-id-type="doi">10.1016/j.ab.2020.113995</pub-id>
</citation>
</ref>
<ref id="B84">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Tan</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Jin</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>L.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>RNALocate: a resource for RNA subcellular localizations</article-title>. <source>Nucleic Acids Res.</source> <volume>45</volume>, <fpage>D135</fpage>&#x2013;<lpage>D138</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkw728</pub-id>
</citation>
</ref>
<ref id="B85">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>Z.-Y.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>Y.-H.</given-names>
</name>
<name>
<surname>Ding</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Lin</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Design powerful predictor for mRNA subcellular location prediction in <italic>Homo sapiens</italic>
</article-title>. <source>Briefings Bioinforma.</source> <volume>22</volume>, <fpage>526</fpage>&#x2013;<lpage>535</lpage>. <pub-id pub-id-type="doi">10.1093/bib/bbz177</pub-id>
</citation>
</ref>
<ref id="B86">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhao</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Song</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Fang</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>NONCODEV6: an updated database dedicated to long non-coding RNA annotation in both animals and plants</article-title>. <source>Nucleic Acids Res.</source> <volume>49</volume>, <fpage>D165</fpage>&#x2013;<lpage>D171</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkaa1046</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>