<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="discussion" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<?covid-19-tdm?>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Big Data</journal-id>
<journal-title>Frontiers in Big Data</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Big Data</abbrev-journal-title>
<issn pub-type="epub">2624-909X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">656553</article-id>
<article-id pub-id-type="doi">10.3389/fdata.2021.656553</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Big Data</subject>
<subj-group>
<subject>Opinion</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Towards Machine-Readable (Meta) Data and the FAIR Value for Artificial Intelligence Exploration of COVID-19 and Cancer Research Data</article-title>
<alt-title alt-title-type="left-running-head">Campos et&#x20;al.</alt-title>
<alt-title alt-title-type="right-running-head">Machine-Readable (Meta)Data, FAIR and AI</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Campos</surname>
<given-names>Maria Luiza. M.</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1317147/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Silva</surname>
<given-names>Eug&#xea;nio</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1318535/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Cerceau</surname>
<given-names>Renato</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1185101/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Cruz</surname>
<given-names>S&#xe9;rgio Manuel Serra da</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff5">
<sup>5</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1042331/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Silva</surname>
<given-names>Fabricio A. B.</given-names>
</name>
<xref ref-type="aff" rid="aff6">
<sup>6</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/618982/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Gouveia</surname>
<given-names>F&#xe1;bio. C.</given-names>
</name>
<xref ref-type="aff" rid="aff7">
<sup>7</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/787354/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Jardim</surname>
<given-names>Rodrigo</given-names>
</name>
<xref ref-type="aff" rid="aff8">
<sup>8</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1344584/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Kotowski</surname>
<given-names>Nelson</given-names>
</name>
<xref ref-type="aff" rid="aff8">
<sup>8</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1305742/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Lopes</surname>
<given-names>Giseli Rabello</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1436609/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>D&#xe1;vila</surname>
<given-names>Alberto. M. R.</given-names>
</name>
<xref ref-type="aff" rid="aff8">
<sup>8</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/301269/overview"/>
</contrib>
</contrib-group>
<aff id="aff1">
<label>
<sup>1</sup>
</label>Instituto de Computa&#x00E7;&#x00E3;o, Universidade Federal do Rio de Janeiro, UFRJ, <addr-line>Rio de Janeiro</addr-line>, <country>Brazil</country>
</aff>
<aff id="aff2">
<label>
<sup>2</sup>
</label>Unidade de Computa&#x00E7;&#x00E3;o (Ucomp), Centro Universitario Estadual da Zona Oeste (UEZO), <addr-line>Rio de Janeiro</addr-line>, <country>Brazil</country>
</aff>
<aff id="aff3">
<label>
<sup>3</sup>
</label>Instituto Nacional de Cardiologia, INC, <addr-line>Rio de Janeiro</addr-line>, <country>Brazil</country>
</aff>
<aff id="aff4">
<label>
<sup>4</sup>
</label>Universidade do Estado do Rio de Janeiro, UERJ, <addr-line>Rio de Janeiro</addr-line>, <country>Brazil</country>
</aff>
<aff id="aff5">
<label>
<sup>5</sup>
</label>Departamento de Ci&#x00EA;ncias da Computa&#x00E7;&#x00E3;o, Universidade Federal Rural do Rio de Janeiro, UFRRJ, <addr-line>Serop&#xe9;dica</addr-line>, <country>Brazil</country>
</aff>
<aff id="aff6">
<label>
<sup>6</sup>
</label>PROCC, FIOCRUZ, <addr-line>Rio de Janeiro</addr-line>, <country>Brazil</country>
</aff>
<aff id="aff7">
<label>
<sup>7</sup>
</label>Casa de Oswaldo Cruz, FIOCRUZ, <addr-line>Rio de Janeiro</addr-line>, <country>Brazil</country>
</aff>
<aff id="aff8">
<label>
<sup>8</sup>
</label>Laborat&#x00F3;rio de Biologia Computacional e Sistemas, Instituto Oswaldo Cruz, FIOCRUZ, <addr-line>Rio de Janeiro</addr-line>, <country>Brazil</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/569637/overview">Ruchir Shah</ext-link>, Sciome LLC, United&#x20;States</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/481771/overview">Akram Mohammed</ext-link>, University of Tennessee Health Science Center (UTHSC), United&#x20;States</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1028642/overview">Arpit Tandon</ext-link>, Sciome LLC, United&#x20;States</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Alberto. M. R. D&#xe1;vila, <email>alberto.davila@fiocruz.br</email>
</corresp>
<fn fn-type="other">
<p>This article was submitted to Medicine and Public Health, a section of the journal Frontiers in Big&#x20;Data</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>30</day>
<month>08</month>
<year>2021</year>
</pub-date>
<pub-date pub-type="collection">
<year>2021</year>
</pub-date>
<volume>4</volume>
<elocation-id>656553</elocation-id>
<history>
<date date-type="received">
<day>21</day>
<month>01</month>
<year>2021</year>
</date>
<date date-type="accepted">
<day>14</day>
<month>07</month>
<year>2021</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2021 Campos, Silva, Cerceau, Cruz, Silva, Gouveia, Jardim, Kotowski, Lopes and D&#xe1;vila.</copyright-statement>
<copyright-year>2021</copyright-year>
<copyright-holder>Campos, Silva, Cerceau, Cruz, Silva, Gouveia, Jardim, Kotowski, Lopes and D&#xe1;vila</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these&#x20;terms.</p>
</license>
</permissions>
<kwd-group>
<kwd>COVID-19</kwd>
<kwd>Findable, Accessible, Interoperable, and Reusable</kwd>
<kwd>cancer</kwd>
<kwd>metadata</kwd>
<kwd>artificial intelligence</kwd>
</kwd-group>
</article-meta>
</front>
<body>
<sec id="s1">
<title>State of the Art</title>
<p>Even before COVID-19, the bioinformatics labs and life science industry were investing extensively in ecosystems of technological and analytical applications/appliances to store, curate, share, integrate, and analyze large amounts of data. With the pandemic coming at an accelerating pace, a series of global research actions are being implemented to strive against&#x20;the virus and its effects and to create data-driven investigations to support more&#x20;agile responses to future events<xref ref-type="fn" rid="FN1">
<sup>1</sup>
</xref>. Innovative solutions in COVID-19 research require more efficient and effective data management strategies and practices. Cancer research is an excellent example of the adoption of the FAIR (Findable, Accessible, Interoperable, and Reusable) data principles (<xref ref-type="bibr" rid="B20">Wilkinson et&#x20;al., 2016</xref>) on precision oncology (<xref ref-type="bibr" rid="B5">Deist et&#x20;al., 2020</xref>; <xref ref-type="bibr" rid="B6">Delgado and Llorente, 2020</xref>; <xref ref-type="bibr" rid="B18">Vesteghem et&#x20;al., 2020</xref>) and major cancer data repositories, such as the NIH Cancer Research Data Commons, are gradually adhering to these principles.</p>
<p>In a broad sense, understanding the whole scenario of a worldwide virus outbreak such as the COVID-19 pandemic has been a great challenge. It involves a huge effort to put together facts and a large volume of data related to the dynamics of the real world, as well as past and current results of scientific research. At the same time, cancer researchers are pivoting portions of their investigations and contributing with their expertise and resources to scientific studies of the SARS-Cov-2. Their findings have been wide in scope, ranging from insights to researching how the virus enters cells to identify potential therapies (<xref ref-type="bibr" rid="B12">NCI Staff, 2021</xref>).</p>
<p>Today, researchers are running against the clock to face at least three barriers to run data-driven investigations. First, data specialists refer to the fact that approximately 80% of researchers&#x2019; time is spent finding, cleaning, and organizing data (<xref ref-type="bibr" rid="B14">Schrage, 2017</xref>; <xref ref-type="bibr" rid="B17">Tyagi, 2020</xref>). Second, the availability of research data declines quite rapidly as articles age (<xref ref-type="bibr" rid="B11">Miyakawa, 2020</xref>). Third, raw data supporting the scientific results or proper descriptions of data repositories (<xref ref-type="bibr" rid="B19">Vines et&#x20;al., 2014)</xref> are lacking in many investigations and articles. These barriers may hinder innovation and scientific development because they increase the so-called &#x201c;reproducibility crisis&#x201d; of scientific experiments. Hence, to circumvent such shortcomings and optimize researchers&#x2019; efforts and time, some research organizations (like the Research Data Alliance<xref ref-type="fn" rid="FN2">
<sup>2</sup>
</xref>, World Data Systems<xref ref-type="fn" rid="FN3">
<sup>3</sup>
</xref>, GO FAIR<xref ref-type="fn" rid="FN4">
<sup>4</sup>
</xref>, etc.) are discussing how data initiatives can be properly incorporated into the life cycle of data-driven experiments, aiming to increase preservation, and sharing and reuse of&#x20;data.</p>
</sec>
<sec id="s2">
<title>COVID-19 and Lessons Learned From Cancer Research</title>
<p>The explosion of biomedical big data has considerably changed the landscape of cancer research. Researchers are used to dealing with complex biological problems and carrying out heterogeneous data-driven investigations (<xref ref-type="bibr" rid="B13">Schade et&#x20;al., 2019</xref>; <xref ref-type="bibr" rid="B1">Bailey et&#x20;al., 2020</xref>). It is a consensus that single research centers cannot produce enough data to fit prognostic and predictive models of sufficient accuracy. Hence, data integration in precision oncology is of great relevance (<xref ref-type="bibr" rid="B12">NCI Staff, 2021</xref>).</p>
<p>Nowadays, large-scale COVID-19 and precision oncology projects face several challenges (<xref ref-type="bibr" rid="B4">Budin-Lj&#xf8;sne et&#x20;al., 2014</xref>; <xref ref-type="bibr" rid="B2">Bertier et&#x20;al., 2016</xref>). Some issues lie in the ways data are recorded, stored, and reused. In addition, various health-care systems are incompatible, making it difficult, expensive, and time-consuming to aggregate datasets from different sources due to the diversity of data involved and poor data management (<xref ref-type="bibr" rid="B18">Vesteghem et&#x20;al., 2020</xref>).</p>
<p>Even before the coronavirus pandemic, various European cancer initiatives have emerged to tackle these issues by standardizing and facilitating data pipelines. Several groups are implementing the FAIR data principles, fostering the use of standards, common metadata models, and ontologies to increase the interoperability and reusability of data in oncology projects (<xref ref-type="bibr" rid="B10">Mart&#xed;nez-Garc&#xed;a et&#x20;al., 2020</xref>; <xref ref-type="bibr" rid="B22">Zong et&#x20;al., 2020</xref>).</p>
<p>Data stewardship is an essential driver of cancer research groups and clinical practice. Since 2016, the FAIR data principles have been resonating in scientific health communities. Enabling data to be FAIR is currently believed to strengthen data sharing, reduce duplicated efforts, make them more findable by machines, and harmonize data from heterogeneous unconnected data silos. These lessons learned by cancer researchers can minimize future health emergencies and humanitarian crises in all countries regarding COVID-19.</p>
</sec>
<sec id="s3">
<title>The COVID-19 Case and FAIR Initiatives</title>
<p>The FAIR guiding principles (<xref ref-type="bibr" rid="B20">Wilkinson et&#x20;al., 2016)</xref> were created to save researchers&#x2019; time and help maximize the impact of health data. The principles began in a few European academic institutions and have burgeoned to include endorsements by global organizations such as the Group of Seven (G7) intergovernmental organization, science funding agencies, and national governments. They are a fundamental enabler of digital transformation and data interoperability in data-driven computing applications. These principles aim to enhance the ability of machines to automatically find and use (meta)data (<xref ref-type="bibr" rid="B8">Heath and Bizer, 2011</xref>).</p>
<p>Several challenges are related to the discovery, access, and interoperability of data from different sources. Before the FAIR principles were proposed, a set of principles and technologies, known as Linked Data, used the Web infrastructure to enable data sharing and reuse on a massive scale (<xref ref-type="bibr" rid="B3">Bizer et&#x20;al., 2009</xref>), creating the Web of Data. The Linked Data principles (<xref ref-type="bibr" rid="B15">Semantic</xref>) are a set of best practices for publishing structured data on the Web, including the following: (i) to use URIs (Uniform Resource Identifiers) as names for things; (ii) to use HTTP URIs so that people can look up those names; (iii) when someone looks up a URI, to provide useful information, using standards like RDF and SPARQL; and (iv) to include links to other URIs so that more resources can be discovered. It is also essential to highlight the need to use controlled vocabularies and ontologies as well as establishing interlinks for proper exploration of the Web of&#x20;Data.</p>
<p>The FAIR principles are focused on research data and are not limited to specific technologies, but they can benefit from Linked Data technologies. FAIR also includes a stated license for access, not addressed by the open nature of Linked Data (<xref ref-type="bibr" rid="B8">Heath and Bizer, 2011</xref>). In this sense, the FAIR Data Point was inspired by the Linked Data platform but targets its development more explicitly related to the FAIR principles (<xref ref-type="bibr" rid="B20">Wilkinson et&#x20;al., 2016</xref>). A FAIR Data Point stores information about the datasets, that is, metadata, both human and machine-readable.</p>
<p>The preparation of data to properly interoperate and be reused can be improved dramatically by implementing the FAIR data principles for scientific data management. Thus, many powerful analytical tools such as machine learning algorithms and artificial intelligence (AI) packages will automatically access the data from which they learn and extract new knowledge. Moreover, in previous stages, machine learning, AI, and data mining techniques can&#x20;also be instrumental: (i) in the step of data&#x20;preparation, for example, helping to transform&#x20;nonstructured data for the publication as structured data, following the Linked Data principles; (ii) in other steps, as in discovering vocabularies and ontologies to annotate the (meta)data or in identifying new datasets for interlinkages.</p>
<p>Thus, the FAIR principles and associated infrastructure can undoubtedly contribute to creating a federated network of data distribution associated with different aspects of the COVID-19 pandemic as well as cancer research. The ideas proposed by the GO FAIR initiative received unprecedented attention. They were endorsed by research data communities that valued the contribution of the GO FAIR movement in putting a lot of emphasis on (meta)data publishing protocols, semantic support, and machine actionable elements.</p>
<p>At the beginning of 2020, the Virus Outbreak Data Network (VODAN)<xref ref-type="fn" rid="FN5">
<sup>5</sup>
</xref> was conceived as an implementation network collaboratively developed to support the capture and use of data, following the FAIR data principles, not only during this pandemic but also on future infectious disease outbreaks. The network serves both human and machine exploration, fostering the reuse and reproducibility of scientific resources. The seed of the VODAN BR project<xref ref-type="fn" rid="FN6">
<sup>6</sup>
</xref> started to implement one of the network data points, with pilot collaboration, collecting, and treating anonymized patients&#x2019; data from COVID-19 cases of two public hospitals, following the World Health Organization standard&#x20;form.</p>
<p>The VODAN BR project started at the beginning of the Brazilian COVID-19 outbreak. The primary goals were to understand the value of FAIR data management through the appropriate education and training of several researchers and health staff, combined with the necessary cultural change motivation. After that, the technological infrastructure to support the FAIR data life cycle was developed and is still under improvement.</p>
<p>Through the so-called FAIRification process, both data and metadata become machine-processable, receive permanent identifiers, and are associated with vocabularies and ontologies to reduce ambiguity. The data licensing scheme may vary from allowing complete open access to more restricted access for research partners only. The metadata, on the other hand, are published in federated FAIR Data Points for open access, and, more importantly, as metadata for the machine (M4M)<xref ref-type="fn" rid="FN7">
<sup>7</sup>
</xref> to be automatically processed or human consumed.</p>
<p>Our general goals are aligned with global efforts developed by the pharmaceutical industry, and other life sciences R and D such as biomedicine, environmental sciences, agriculture, and food production. For instance, there are several successful cases in the big pharma industry. AstraZeneca intensified the use of identifiers to find and access internal data. Roche, Bayer, and SciBite demonstrated the value of interoperability through linked (meta)data (<xref ref-type="bibr" rid="B7">Hasnain et&#x20;al., 2018</xref>). Nevertheless, the major value of FAIR data to the VODAN BR project and any other organization is the larger reusability beyond the initial and primary purpose of the datasets (<xref ref-type="bibr" rid="B21">Wise et&#x20;al., 2019</xref>).</p>
<p>The FAIRification process enables us to achieve more value from internal and external data over a greater period. The associated linked provenance and general metadata are expected to persist as a permanent scientific record, even when the original data have lost value and have been archived or eventually deleted as a part of the FAIR data management life&#x20;cycle.</p>
<p>In the present pandemic scenario, actions that can amplify data sharing, and globally contribute to research&#x20;development&#x2014;with carefully defined levels of openness to protect sensitive data&#x2014;are key for generating rapid and coordinated responses from science. Briefly, VODAN BR is one of these efforts, dealing with the challenges of establishing a distributed infrastructure to harvest COVID-19 semantic (meta)data. It starts by addressing patients&#x2019; data and is then expected to evolve by effectively supporting interoperability with many other distributed datasets using artificial intelligence, machine learning, and data science algorithms to assist health teams and public managers in making better data-driven decisions.</p>
<p>Last but not least, considering that data from omics sciences are produced at an unprecedented speed and volume, surpassed only by data produced by astronomers (<xref ref-type="bibr" rid="B16">Stephens et&#x20;al., 2015</xref>), adopting the FAIR principles is undoubtedly critical to support genomic-based research and discoveries globally.</p>
</sec>
</body>
<back>
<sec id="s4">
<title>Author Contributions</title>
<p>All authors listed have made a substantial, direct, and intellectual contribution to the work and approved it for publication.</p>
</sec>
<sec sec-type="COI-statement" id="s5">
<title>Conflict of Interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s6">
<title>Publisher&#x2019;s Note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<fn-group>
<fn id="FN1">
<label>1</label>
<p>Establishing a FAIR Biomedical Data Ecosystem: The Role of Generalist Repositories to Enhance Data Discoverability and Reuse Workshop. February 11, 2020&#x2013;February 12, 2020&#x2013;NIH Main Campus (<ext-link ext-link-type="uri" xlink:href="https://datascience.cancer.gov/news-events/events/establishing-fair-biomedical-data-ecosystem-role-generalist-repositories-enhance">https://datascience.cancer.gov/news-events/events/establishing-fair-biomedical-data-ecosystem-role-generalist-repositories-enhance</ext-link>).</p>
</fn>
<fn id="FN2">
<label>2</label>
<p>
<ext-link ext-link-type="uri" xlink:href="%20https://www.rd-alliance.org/">https://www.rd-alliance.org/</ext-link>
</p>
</fn>
<fn id="FN3">
<label>3</label>
<p>
<ext-link ext-link-type="uri" xlink:href="%20https://www.worlddatasystem.org/">https://www.worlddatasystem.org/</ext-link>
</p>
</fn>
<fn id="FN4">
<label>4</label>
<p>
<ext-link ext-link-type="uri" xlink:href="%20https://www.go-fair.org/">https://www.go-fair.org/</ext-link>
</p>
</fn>
<fn id="FN5">
<label>5</label>
<p>
<ext-link ext-link-type="uri" xlink:href="%20https://www.go-fair.org/implementation-networks/overview/vodan/">https://www.go-fair.org/implementation-networks/overview/vodan/</ext-link>
</p>
</fn>
<fn id="FN6">
<label>6</label>
<p>
<ext-link ext-link-type="uri" xlink:href="%20https://vodanbr.github.io/">https://vodanbr.github.io/</ext-link>
</p>
</fn>
<fn id="FN7">
<label>7</label>
<p>
<ext-link ext-link-type="uri" xlink:href="%20https://www.go-fair.org/how-to-go-fair/metadata-for-machines/">https://www.go-fair.org/how-to-go-fair/metadata-for-machines/</ext-link>
</p>
</fn>
</fn-group>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bailey</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Black</surname>
<given-names>J.&#x20;R. M.</given-names>
</name>
<name>
<surname>Swanton</surname>
<given-names>C.</given-names>
</name>
</person-group>
<collab>, and Cancer Research</collab> (<year>2020</year>). <article-title>Cancer Research: The Lessons to Learn from COVID-19</article-title>. <source>Cancer Discov.</source> <volume>10</volume> (<issue>9</issue>), <fpage>1263</fpage>&#x2013;<lpage>1266</lpage>. <pub-id pub-id-type="doi">10.1158/2159-8290.CD-20-0823</pub-id> </citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bertier</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Carrot-Zhang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Ragoussis</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Joly</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Integrating Precision Cancer Medicine into Healthcare&#x2014;Policy, Practice, and Research Challenges</article-title>. <source>Genome Med.</source> <volume>8</volume> (<issue>1</issue>), <fpage>108</fpage>. <pub-id pub-id-type="doi">10.1186/s13073-016-0362-4</pub-id> </citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bizer</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Heath</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Berners-Lee</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Linked Data - the Story So Far</article-title>. <source>Int</source>. </citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Budin-Lj&#xf8;sne</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Isaeva</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Knoppers</surname>
<given-names>B. M.</given-names>
</name>
<name>
<surname>Tass&#xe9;</surname>
<given-names>A. M.</given-names>
</name>
<name>
<surname>Shen</surname>
<given-names>H. Y.</given-names>
</name>
<name>
<surname>McCarthy</surname>
<given-names>M. I.</given-names>
</name>
<etal/>
</person-group> (<year>2014</year>). <article-title>Data Sharing in Large Research Consortia: Experiences and Recommendations from ENGAGE</article-title>. <source>Eur. J.&#x20;Hum. Genet.</source> <volume>22</volume> (<issue>3</issue>), <fpage>317</fpage>&#x2013;<lpage>321</lpage>. <pub-id pub-id-type="doi">10.1038/ejhg.2013.131</pub-id> </citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Deist</surname>
<given-names>T. M.</given-names>
</name>
<name>
<surname>Dankers</surname>
<given-names>F. J.&#x20;W. M.</given-names>
</name>
<name>
<surname>Ojha</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Scott Marshall</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Janssen</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Faivre-Finn</surname>
<given-names>C.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Distributed Learning on 20&#x20;000&#x2b; Lung Cancer Patients - the Personal Health Train</article-title>. <source>Radiother. Oncol.</source> <volume>144</volume>, <fpage>189</fpage>&#x2013;<lpage>200</lpage>. <comment>Available from: <ext-link ext-link-type="uri" xlink:href="https://www.sciencedirect.com/science/article/pii/S0167814019334899">https://www.sciencedirect.com/science/article/pii/S0167814019334899</ext-link>
</comment>. <pub-id pub-id-type="doi">10.1016/j.radonc.2019.11.019</pub-id> </citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Delgado</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Llorente</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Security and Privacy when Applying FAIR Principles to Genomic Information</article-title>. <source>Stud. Health Technol. Inform.</source> <volume>275</volume>, <fpage>37</fpage>&#x2013;<lpage>41</lpage>. <pub-id pub-id-type="doi">10.3233/SHTI200690</pub-id> </citation>
</ref>
<ref id="B7">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Hasnain</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Rebholz-Schuhmann</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2018</year>). &#x201c;<article-title>Assessing FAIR Data Principles against the 5-Star Open Data Principles</article-title>,&#x201d; in <source>The Semantic Web: ESWC 2018 Satellite Events. ESWC 2018. LNCS</source>. Editor <person-group person-group-type="editor">
<name>
<surname>Gangemi</surname>
<given-names>A.</given-names>
</name>
</person-group> (<publisher-name>Springer</publisher-name>), <volume>Vol. 11155</volume>. </citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Heath</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Bizer</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Linked Data: Evolving the Web into a Global Data Space</article-title>. <source>Synth. Lectures Semantic Web: Theor. Technol.</source> <volume>1</volume>, <fpage>1</fpage>&#x2013;<lpage>136</lpage>. <pub-id pub-id-type="doi">10.2200/s00334ed1v01y201102wbe001</pub-id> </citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Learned</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Durbin</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Currie</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Kephart</surname>
<given-names>E. T.</given-names>
</name>
<name>
<surname>Beale</surname>
<given-names>H. C.</given-names>
</name>
<name>
<surname>Sanders</surname>
<given-names>L. M.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Barriers to Accessing Public Cancer Genomic Data</article-title>. <source>Sci. Data</source> <volume>6</volume>, <fpage>98</fpage>. <pub-id pub-id-type="doi">10.1038/s41597-019-0096-4</pub-id> </citation>
</ref>
<ref id="B10">
<citation citation-type="web">
<person-group person-group-type="author">
<name>
<surname>Mart&#xed;nez-Garc&#xed;a</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Parra-Calder&#xf3;n</surname>
<given-names>C. L.</given-names>
</name>
<name>
<surname>Chronaki</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Cangioli</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>L&#xf6;be</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Juehne</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>FAIRness for FHIR Project: Making Health Datasets FAIR Using HL7 FHIR</article-title>. <comment>Research Data Alliance [Internet]</comment>. <comment>Available from: <ext-link ext-link-type="uri" xlink:href="https://www.fair4health.eu/storage/files/Resource/49/RDA%20VP17%20-%20Poster%20FHIR4FAIR%20-%20Poster_v3.pdf">https://www.fair4health.eu/storage/files/Resource/49/RDA VP17 - Poster FHIR4FAIR - Poster_v3.pdf</ext-link>
</comment>. </citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Miyakawa</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>No Raw Data, No Science: Another Possible Source of the Reproducibility Crisis</article-title>. <source>Mol. Brain</source> <volume>13</volume>, <fpage>24</fpage>. <pub-id pub-id-type="doi">10.1186/s13041-020-0552-2</pub-id> </citation>
</ref>
<ref id="B12">
<citation citation-type="book">
<collab>NCI Staff</collab> (<year>2021</year>). <source>Cancer Researchers Bring Tools, Experience to COVID-19 Studies</source>. <comment>[Internet]</comment>. <comment>Available from <ext-link ext-link-type="uri" xlink:href="https://www.cancer.gov/news-events/cancer-currents-blog/2021/cancer-researchers-covid-19-studies">https://www.cancer.gov/news-events/cancer-currents-blog/2021/cancer-researchers-covid-19-studies</ext-link> (cited May 19, 2021)</comment>.</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Schade</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Ogilvie</surname>
<given-names>L. A.</given-names>
</name>
<name>
<surname>Kessler</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Sch&#xfc;tte</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Wierling</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Lange</surname>
<given-names>B. M.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>A Data- and Model-Driven Approach for Cancer Treatment</article-title>. <source>Onkologe</source> <volume>25</volume>, <fpage>132</fpage>&#x2013;<lpage>137</lpage>. <pub-id pub-id-type="doi">10.1007/s00761-019-0624-z</pub-id> </citation>
</ref>
<ref id="B14">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Schrage</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2017</year>). <source>AI Is Going to Change the 80/20 Rule</source>. <comment>Harvard Business Review [Internet]</comment>. <comment>Available from: <ext-link ext-link-type="uri" xlink:href="https://hbr.org/2017/02/ai-is-going-to-change-the-8020-rule">https://hbr.org/2017/02/ai-is-going-to-change-the-8020-rule</ext-link>
</comment>.</citation>
</ref>
<ref id="B15">
<citation citation-type="other">
<person-group person-group-type="author">
<name>
<surname>Semantic</surname>
<given-names>J.</given-names>
</name>
</person-group> <source>Web Inf. Syst.</source> <volume>5</volume>, <fpage>1</fpage>&#x2013;<lpage>22</lpage>.</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Stephens&#x200b;</surname>
<given-names>Z. D.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>S. Y.</given-names>
</name>
<name>
<surname>Faghri</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Campbell</surname>
<given-names>R. H.</given-names>
</name>
<name>
<surname>Zhai</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Efron</surname>
<given-names>M. J.</given-names>
</name>
<etal/>
</person-group> (<year>2015</year>). <article-title>Big Data: Astronomical or Genomical?</article-title>. <source>
<italic>PLoS Biol</italic>&#x200b; &#x200b;.</source> <volume>13</volume> (<issue>7</issue>), <fpage>e1002195</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pbio.1002195</pub-id> </citation>
</ref>
<ref id="B17">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Tyagi</surname>
<given-names>A. K.</given-names>
</name>
</person-group> (<year>2020</year>). <source>Data Science and Data Analytics Opportunities and Challenges</source>. <edition>1st Edition</edition>. Editor <person-group person-group-type="editor">
<name>
<surname>Tyagi</surname>
<given-names>A. K.</given-names>
</name>
</person-group> <fpage>486</fpage>.</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Vesteghem</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Br&#xf8;ndum</surname>
<given-names>R. F.</given-names>
</name>
<name>
<surname>S&#xf8;nderk&#xe6;r</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Sommer</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Schmitz</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>B&#xf8;dker</surname>
<given-names>J.&#x20;S.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Implementing the FAIR Data Principles in Precision Oncology: Review of Supporting Initiatives</article-title>. <source>Brief Bioinform</source> <volume>21</volume> (<issue>3</issue>), <fpage>936</fpage>&#x2013;<lpage>945</lpage>. <pub-id pub-id-type="doi">10.1093/bib/bbz044</pub-id> </citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Vines</surname>
<given-names>H. T.</given-names>
</name>
<name>
<surname>Albert</surname>
<given-names>A. Y. K.</given-names>
</name>
<name>
<surname>Andrew</surname>
<given-names>R. L.</given-names>
</name>
<name>
<surname>D&#xe9;barre</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Bock</surname>
<given-names>D. G.</given-names>
</name>
<name>
<surname>Franklin</surname>
<given-names>M. T.</given-names>
</name>
<etal/>
</person-group> (<year>2014</year>). <article-title>The Availability of Research Data Declines Rapidly with Article Age</article-title>. <source>Curr. Biol. n</source> <volume>24</volume>, <fpage>94</fpage>&#x2013;<lpage>97</lpage>. <pub-id pub-id-type="doi">10.1016/j.cub.2013.11.014</pub-id> </citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wilkinson</surname>
<given-names>M. D.</given-names>
</name>
<name>
<surname>Dumontier</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Aalbersberg</surname>
<given-names>I. J.</given-names>
</name>
<name>
<surname>Appleton</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Axton</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Baak</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>The FAIR Guiding Principles for Scientific Data Management and Stewardship</article-title>. <source>Sci. Data</source> <volume>3</volume>, <fpage>160018</fpage>. <pub-id pub-id-type="doi">10.1038/sdata.2016.18</pub-id> </citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wise</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>de Barron</surname>
<given-names>A. G.</given-names>
</name>
<name>
<surname>Splendiani</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Balali-Mood</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Vasant</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Little</surname>
<given-names>E.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Implementation and Relevance of FAIR Data Principles in Biopharmaceutical R&#x26;D</article-title>. <source>Drug Discov. Today</source> <volume>24</volume>, <fpage>933</fpage>&#x2013;<lpage>938</lpage>. <pub-id pub-id-type="doi">10.1016/j.drudis.2019.01.008</pub-id> </citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zong</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Wen</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Stone</surname>
<given-names>D. J.</given-names>
</name>
<name>
<surname>Sharma</surname>
<given-names>D. K.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Yu</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Developing an FHIR-Based Computational Pipeline for Automatic Population of Case Report Forms for Colorectal Cancer Clinical Trials Using Electronic Health Records</article-title>. <source>JCO Clin. Cancer Inform.</source> (<issue>4</issue>), <fpage>201</fpage>&#x2013;<lpage>2099</lpage>. <comment>[Internet]</comment>. <pub-id pub-id-type="doi">10.1200/CCI.19.00116</pub-id> </citation>
</ref>
</ref-list>
</back>
</article>