<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Immunol.</journal-id>
<journal-title>Frontiers in Immunology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Immunol.</abbrev-journal-title>
<issn pub-type="epub">1664-3224</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fimmu.2021.735609</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Immunology</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>The Cancer Epitope Database and Analysis Resource: A Blueprint for the Establishment of a New Bioinformatics Resource for Use by the Cancer Immunology Community</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Ko&#x15f;alo&#x11f;lu-Yal&#xe7;&#x131;n</surname>
<given-names>Zeynep</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1191697"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Blazeska</surname>
<given-names>Nina</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1283216"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Carter</surname>
<given-names>Hannah</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Nielsen</surname>
<given-names>Morten</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<xref ref-type="aff" rid="aff5">
<sup>5</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/479847"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Cohen</surname>
<given-names>Ezra</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Kufe</surname>
<given-names>Donald</given-names>
</name>
<xref ref-type="aff" rid="aff6">
<sup>6</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/37112"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Conejo-Garcia</surname>
<given-names>Jose</given-names>
</name>
<xref ref-type="aff" rid="aff7">
<sup>7</sup>
</xref>
<xref ref-type="aff" rid="aff8">
<sup>8</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1267473"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Robbins</surname>
<given-names>Paul</given-names>
</name>
<xref ref-type="aff" rid="aff9">
<sup>9</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/825756"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Schoenberger</surname>
<given-names>Stephen P.</given-names>
</name>
<xref ref-type="aff" rid="aff10">
<sup>10</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Peters</surname>
<given-names>Bjoern</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/487574"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Sette</surname>
<given-names>Alessandro</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/140600"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Center for Infectious Disease and Vaccine Research, La Jolla Institute for Immunology</institution>, <addr-line>La Jolla, CA</addr-line>, <country>United States</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Department of Medicine, University of California San Diego</institution>, <addr-line>La Jolla, CA</addr-line>, <country>United States</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Moore&#x2019;s Cancer Center, University of California San Diego</institution>, <addr-line>La Jolla, CA</addr-line>, <country>United States</country>
</aff>
<aff id="aff4">
<sup>4</sup>
<institution>Department of Bio and Health Informatics, Technical University of Denmark</institution>, <addr-line>Lyngby</addr-line>, <country>Denmark</country>
</aff>
<aff id="aff5">
<sup>5</sup>
<institution>Instituto de Investigaciones Biotecnol&#xf3;gicas, Universidad Nacional de San Mart&#xed;n</institution>, <addr-line>San Mart&#xed;n</addr-line>, <country>Argentina</country>
</aff>
<aff id="aff6">
<sup>6</sup>
<institution>Dana Farber Cancer Institute, Harvard Medical School</institution>, <addr-line>Boston, MA</addr-line>, <country>United States</country>
</aff>
<aff id="aff7">
<sup>7</sup>
<institution>Department of Gynecologic Oncology, H. Lee Moffitt Cancer Center and Research Institute</institution>, <addr-line>Tampa, FL</addr-line>, <country>United States</country>
</aff>
<aff id="aff8">
<sup>8</sup>
<institution>Department of Immunology, H. Lee Moffitt Cancer Center and Research Institute</institution>, <addr-line>Tampa, FL</addr-line>, <country>United States</country>
</aff>
<aff id="aff9">
<sup>9</sup>
<institution>National Cancer Institute, National Institutes of Health</institution>, <addr-line>Bethesda, MD</addr-line>, <country>United States</country>
</aff>
<aff id="aff10">
<sup>10</sup>
<institution>Laboratory of Cellular Immunology, La Jolla Institute for Immunology</institution>, <addr-line>La Jolla, CA</addr-line>, <country>United States</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>Edited by: Olivera J. Finn, University of Pittsburgh, United States</p>
</fn>
<fn fn-type="edited-by">
<p>Reviewed by: Pramod Kumar Srivastava, University of Connecticut, United States; Hans-Georg Rammensee, University of T&#xfc;bingen, Germany</p>
</fn>
<fn fn-type="corresp" id="fn001">
<p>*Correspondence: Alessandro Sette, <email xlink:href="mailto:alex@lji.org">alex@lji.org</email>
</p>
</fn>
<fn fn-type="other" id="fn002">
<p>This article was submitted to Cancer Immunity and Immunotherapy, a section of the journal Frontiers in Immunology</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>24</day>
<month>08</month>
<year>2021</year>
</pub-date>
<pub-date pub-type="collection">
<year>2021</year>
</pub-date>
<volume>12</volume>
<elocation-id>735609</elocation-id>
<history>
<date date-type="received">
<day>02</day>
<month>07</month>
<year>2021</year>
</date>
<date date-type="accepted">
<day>09</day>
<month>08</month>
<year>2021</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2021 Ko&#x15f;alo&#x11f;lu-Yal&#xe7;&#x131;n, Blazeska, Carter, Nielsen, Cohen, Kufe, Conejo-Garcia, Robbins, Schoenberger, Peters and Sette</copyright-statement>
<copyright-year>2021</copyright-year>
<copyright-holder>Ko&#x15f;alo&#x11f;lu-Yal&#xe7;&#x131;n, Blazeska, Carter, Nielsen, Cohen, Kufe, Conejo-Garcia, Robbins, Schoenberger, Peters and Sette</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>Recent years have witnessed a dramatic rise in interest towards cancer epitopes in general and particularly neoepitopes, antigens that are encoded by somatic mutations that arise as a consequence of tumorigenesis. There is also an interest in the specific T cell and B cell receptors recognizing these epitopes, as they have therapeutic applications. They can also aid in basic studies to infer the specificity of T cells or B cells characterized in bulk and single-cell sequencing data. The resurgence of interest in T cell and B cell epitopes emphasizes the need to catalog all cancer epitope-related data linked to the biological, immunological, and clinical contexts, and, most importantly, to make this information freely available to the scientific community in a user-friendly format. In parallel, there is also a need to develop resources for epitope prediction and analysis tools that provide researchers access to predictive strategies and provide objective evaluations of their performance. For example, such tools should enable researchers to identify epitopes that can be effectively used for immunotherapy or in defining biomarkers to predict the outcome of checkpoint blockade therapies. We present here a detailed vision, blueprint, and work plan for the development of a new resource, the <bold>C</bold>ancer <bold>E</bold>pitope <bold>D</bold>atabase and <bold>A</bold>nalysis <bold>R</bold>esource (CEDAR). CEDAR will provide a freely accessible, comprehensive collection of cancer epitope and receptor data curated from the literature and provide easily accessible epitope and T cell/B cell target prediction and analysis tools. The curated cancer epitope data will provide a transparent benchmark dataset that can be used to assess how well prediction tools perform and to develop new prediction tools relevant to the cancer research community.</p>
</abstract>
<kwd-group>
<kwd>cancer</kwd>
<kwd>epitope analysis</kwd>
<kwd>database (all types)</kwd>
<kwd>neoantigen</kwd>
<kwd>bioinformatics</kwd>
</kwd-group>
<contract-sponsor id="cn001">National Cancer Institute<named-content content-type="fundref-id">10.13039/100000054</named-content>
</contract-sponsor>
<contract-sponsor id="cn002">National Cancer Institute<named-content content-type="fundref-id">10.13039/100000054</named-content>
</contract-sponsor>
<counts>
<fig-count count="7"/>
<table-count count="0"/>
<equation-count count="0"/>
<ref-count count="81"/>
<page-count count="14"/>
<word-count count="7571"/>
</counts>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<title>Introduction</title>
<p>Recent years have witnessed a dramatic rise in interest towards cancer epitopes, studies that have been greatly facilitated by the dramatic decrease in the cost of whole-exome and transcriptome sequencing, as well as advances in mass spectrometry that have resulted in the generation of large datasets of candidate T cell epitopes that are naturally processed and presented (<xref ref-type="bibr" rid="B1">1</xref>). This resurgence of interest is linked to the exceptional success of immune checkpoint blockade therapies that disengage immune suppressive mechanisms and enable cancer antigen-specific T cells to recognize and attack tumor cells expressing those antigens (<xref ref-type="bibr" rid="B2">2</xref>&#x2013;<xref ref-type="bibr" rid="B4">4</xref>). Additionally, current research suggests that combining checkpoint blockade treatment and neoantigen-directed therapies, such as vaccines or adoptive T cell transfer, can enhance treatment efficacy (<xref ref-type="bibr" rid="B5">5</xref>). More recently, checkpoint blockade therapies have been expanded to the neoadjuvant pre-surgical setting, where the aim is to enhance systemic immunity against a broader set of tumor antigens to eliminate micro-metastatic tumors that would otherwise be the source of a relapse (<xref ref-type="bibr" rid="B6">6</xref>). Despite these advances, only a subset of patients benefits from these immunotherapies.</p>
<p>Comprehensively cataloging all cancer epitope-related data linked to the biological, immunological, and clinical contexts will aid in understanding the biological mechanisms associated with efficacy and developing more effective therapeutic approaches. In parallel, researchers need access to computational epitope prediction and analysis tools but also need resources to aid in objective evaluation of the performance of different predictive strategies.</p>
<p>There have been several recent efforts to address these needs. The TANTIGEN 2.0 database (<xref ref-type="bibr" rid="B7">7</xref>) contains curated epitope and ligand elution data for many different cancer antigens, such as neoantigens and differentiation antigens. However, TANTIGEN does not include peptides that were shown to be ineffective and also lacks any association with clinical data. Similarly, The Cancer Antigenic Peptide Database (<uri xlink:href="https://caped.icp.ucl.ac.be">https://caped.icp.ucl.ac.be</uri>) also only includes curated epitope data for several different cancer antigens. NEPdb (<xref ref-type="bibr" rid="B8">8</xref>) contains curated neoantigens but lacks any other types of cancer antigens. For cataloged neoepitopes, associated receptor information and clinical data are also provided if available. It is possible to query NEPdb for an epitope sequence of interest, but there is no option to search for receptors. dbPepNeo (<xref ref-type="bibr" rid="B9">9</xref>) only contains curated HLA class I restricted neoantigens and ligand elution data. Importantly, while all resources provide some basic tools to query the databases for cancer types and peptide sequences, it is not possible to perform specific and granular queries. These resources also do not allow the user to perform any predictions for peptides of interest.</p>
<p>To fill these gaps, we here describe the plans and blueprint to develop a new resource, the Cancer Epitope Database and Analysis Resource (CEDAR). CEDAR is envisioned as a comprehensive bioinformatics resource, which will provide access to curated cancer epitope data, including mutated and non-mutated cancer epitopes, and bioinformatics tools for epitope and receptor analysis and prediction. The work proposed here will build on the Immune Epitope Database (IEDB), in existence since 2003, fully operational and independently funded until at least 2025 by the National Institute of Allergy and Infectious Diseases (NIAID) (<xref ref-type="bibr" rid="B10">10</xref>). The IEDB&#x2019;s focus is on allergy, infectious disease, transplantation, and autoimmunity but does not include cancer. Analogous to the IEDB, CEDAR will include all cancer-specific epitope data from various T&#xa0;cell and B cell experiments, MHC binding assays, and MHC ligandomics by mass-spectrometry. CEDAR will also include results from <italic>in vivo</italic> experiments such as tumor rejection and/or tumor control data. The granular curation of the data and the flexible query structure of CEDAR will allow the user to perform detailed queries to retrieve epitopes supported by different experimental data.</p>
<p>We believe that CEDAR will address an existing need because there is currently no comprehensive informatics resource available to the scientific community that stores data on cancer epitopes, the receptors that recognize them, and the immunological, clinical, and biological context in which they are recognized. In addition to a database of cancer epitopes, CEDAR will provide a set of analysis and prediction tools that will enable cancer researchers to predict putative epitope targets in a tumor sample of interest and also predict the likely specificity of T cell receptors (TCR) or B cell receptors (BCR) identified in single-cell sequencing data. CEDAR will also include benchmarking of existing epitope prediction tools and provide side-by-side comparisons of performance. The significance of these features lies in their utility for the broader community of cancer researchers. Currently, many cancer researchers are using the IEDB and its related tools to attempt to answer questions like this, which is suboptimal given that the IEDB was designed for applications outside of cancer (<xref ref-type="bibr" rid="B11">11</xref>).</p>
</sec>
<sec id="s2" sec-type="results">
<title>Results</title>
<sec id="s2_1">
<title>A Plan to Define the CEDAR Database Scope Based on the Salient Characteristics of Cancer Epitope Data and Metadata</title>
<p>Following initial interviews with cancer experts, we identified the elements relating to an epitope that should be captured in CEDAR (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1</bold>
</xref>), including seven main &#x201c;field groups&#x201d;, namely (1) related to the structure of the epitope, (2) the protein/antigen source from which the epitope is derived, (3) the host associated with the identified epitope responses, (4) the features of the tumor sample, isolate or model, (5) the effectors of the immune responses (both B and T cell responses), (6) the ability and modality of the effector responses to recognize the epitope and cancer cells, and (7) the source of the information that is captured. CEDAR will also identify whether the information captured is derived from a scientific publication, through a direct submission to CEDAR, or gathered from other online resources, and in each case, clearly state the provenance information.</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>Summary of salient characteristics of cancer epitope data and metadata for CEDAR.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fimmu-12-735609-g001.tif"/>
</fig>
</sec>
<sec id="s2_2">
<title>Structure and Antigen Source of the Epitope and Type of Cancer Mutations</title>
<p>Different fields and subfields were defined to enable capturing information in a granular yet searchable and accurate fashion. First, we designated fields to capture the amino-acid sequence of the epitope together with associated post-translational modifications such as phosphorylation and glycosylation. In the case of non-peptidic epitopes, such as, for example, CHO epitopes recognized by antibody responses or ceramides used to expand natural killer (NK) T cells, the structures are captured following the format of ChEBI (<xref ref-type="bibr" rid="B12">12</xref>) and PubChem (<xref ref-type="bibr" rid="B13">13</xref>) resources.</p>
<p>We next defined a set of fields to indicate the general characteristics of the antigen. Specific fields distinguish and classify mutated epitopes (neoepitopes), tumor-associated antigens (TAA) such as differentiation or tissue-specific antigens (e.g., Melan-A, PSA), overexpressed antigens (e.g., HER-2, Muc-1), or cancer-germline antigens (e.g., MAGE, NY-ESO1). For peptidic antigens encoded in the host genome, we defined subfields to capture the gene and protein names of the unmodified antigen, the type [e.g., a self-protein or endogenous retroelement antigens such as long terminal repeats (LTR) or endogenous retroviruses (ERVs) (<xref ref-type="bibr" rid="B14">14</xref>)], and its frequency and magnitude of expression in healthy tissues for different tissue and cell types, as well as developmental stages (<xref ref-type="bibr" rid="B15">15</xref>). For non-peptidic self-antigens such as carbohydrates or gangliosides, we defined fields to record their presence in different tissues. Similarly, for epitopes derived from non-self-tumor-associated antigens, specific antigens are captured (e.g., protein from HPV). We designated a final set of fields to capture normal properties associated with the antigen, such as subcellular location and involvement in biological functions based on GeneOntology (<xref ref-type="bibr" rid="B16">16</xref>, <xref ref-type="bibr" rid="B17">17</xref>), and whether the antigen is a driver gene, known to be causally linked to cancer progression (i.e., oncogene, tumor suppressor gene). A set of subfields also captures expression in pre-malignancies and the frequency and magnitude of expression in various tumor types (<xref ref-type="bibr" rid="B18">18</xref>, <xref ref-type="bibr" rid="B19">19</xref>) and cancer cell lines (<xref ref-type="bibr" rid="B20">20</xref>).</p>
<p>We designated a distinct but equally important set of fields to capture the type of cancer mutations in the source antigen and their impact on the antigen, including the mutation type, such as single or multi nucleotide variants, frameshift, or non-frameshift indels and chromosomal rearrangements. The effect of the mutation (coding: missense or premature stop codon, frameshift, synonymous; non-coding: splice sites, UTR or other), and the outcome of the mutation on the antigen, distinguishing dysregulated expression, functional impact of the mutation on source antigen (<xref ref-type="bibr" rid="B21">21</xref>, <xref ref-type="bibr" rid="B22">22</xref>), structural localization of mutation impact (<xref ref-type="bibr" rid="B23">23</xref>), localization in functional domains (<xref ref-type="bibr" rid="B21">21</xref>, <xref ref-type="bibr" rid="B24">24</xref>), and known or predicted surface accessibility (<xref ref-type="bibr" rid="B23">23</xref>) are captured in additional subfields.</p>
</sec>
<sec id="s2_3">
<title>Fields Related to the Host Organism</title>
<p>We designated a set of fields and subfields to capture the organism associated with the epitope response in terms of species (most references will either be related to human responses or tumor animal models, primarily mice or rats), age, sex, strain or ethnicity, and the major histocompatibility complex (MHC). A separate set of fields was defined to capture the general feature of the cancer, such as natural occurrence and known associated risk factors <italic>versus</italic> induced cancers (genetically engineered organism with spontaneous tumor, xenograft, cancerogenic treatment induced). Cancer classification and diagnosis are captured in designated subfields as well, including anatomical site, histology, tumor stage, and any type of pre-treatment. Additional subfields capture relevant characteristics of the host, such as microsatellite instability (MSI) and HPV status. If the subject from which the responses were derived was vaccinated, the specifics of such treatment are captured in terms of the vaccine antigen delivery format (synthetic peptide, mRNA, DNA plasmid, viral vector, and so on), adjuvant used, administration specifics, and formulation details. Additional fields were designated to capture other types of immunotherapies such as adoptive cell therapy (tumor-infiltrating lymphocytes (TIL) therapy, engineered TCR therapy, chimeric antigen receptor (CAR) T cell therapy, natural killer (NK) cell therapy), and checkpoint blockade therapy (e.g., anti-PD-1, anti-CTLA-4 therapy). If available, doses and dose sizes, information about targeted antigens, corresponding TCR sequences, 3D structures, and therapeutic interventions such as treatments with chemotherapy, radiation, surgery, or oncolytic viruses can be captured as well. 
Defined subfields will also capture clinical outcome, such as complete response, partial response, or cancer progression, and overall or progression-free survival, as well as reduction of tumor burden, change in tumor markers, and any adverse events of therapy, including autoimmune reactions.</p>
<p>We also designated fields to document the sample, isolate, or model associated with the source antigen of the epitope. Specifically, these fields record the sample nature (primary sample/short-term line vs. stable cell line), its occurrence (primary, metastasis, recurring), and whether the sample was obtained pre- or post-treatment. If available, tumor sample purity is also captured (from histology or predicted from sequencing data), as well as the overall mutational burden of the sample. Any available evidence for epitope/antigen expression in terms of frequency and magnitude of epitope/antigen expression in the sample is also documented. Importantly, CEDAR has designated fields to capture the evidence type for the epitope/antigen as detected in whole-genome, whole-exome, transcriptome, or targeted gene panel sequencing, together with the depth and coverage at the epitope site. In the event of a mutated antigen, details related to the mutation are stored, such as its origin (somatic/germline), tools that reported the mutation, read depth at the mutation site, and variant allele frequencies in the tumor DNA sample and RNA sample, if available. Supporting mass-spectrometry elution data are also captured if available. A separate set of fields was defined to document features related to the tumor environment, including the presence of T cells and characterized subsets.</p>
<p>CEDAR will also include results from <italic>in vivo</italic> experiments such as tumor rejection and/or tumor control data. In such cases, details about the used mouse models or the patients from clinical trials will also be captured.</p>
</sec>
<sec id="s2_4">
<title>Fields Related to Capturing Immune Responses</title>
<p>CEDAR aims to capture the general features of the effector material, including the source of effector cells or antibodies, whether they were (<italic>ex vivo</italic>) T cells, short-term cultured or stable cell lines that were isolated from a tumor-affected host, or whether they were induced/engineered cell lines. Information related to antibody class and subclass and cell phenotypes, including CD4/CD8/NKT subset data and expression of phenotypic markers, is also captured. If available, corresponding TCR and antibody sequences, as well as 3D structures, will also be documented, considering the different levels of resolution associated with various techniques such as targeted sequencing of CDR3 regions and full-length TCR sequencing. We also designated subfields for possible synonymous TCR or BCR sequences encoded by different V(D)J sequences, with the opportunity to capture evidence of immunoediting or antigen loss, if available.</p>
<p>In addition to this, CEDAR also documents the specific assays performed to measure recognition. Examples include ELISPOT, intracellular cytokine staining (ICS) or tetramer assays for T cells, ELISA, antibody-dependent cell-mediated cytotoxicity (ADCC), and fluorescence assays for antibodies. A separate series of fields was defined to capture the effector mode of recognition, namely the capacity to recognize tumor cells directly, cell lines transfected with RNA, or cell lines pulsed with peptides. Particularly relevant for MHC class II-restricted responses is the curation of the type of antigen-presenting cell (APC) involved in the assay determination. A final and most crucial set of fields was defined to capture the results of the assessment, as available in qualitative (positive/negative) and quantitative (magnitude) terms. Importantly, the quality of negative controls associated with the assay, such as data related to MHC and antigen expression, will be carefully curated because a negative result is not valid if the MHC or antigen is not expressed. CEDAR will also capture the number of subjects tested/responded, the type of tested &#x2018;target&#x2019;, and in the case of mutated epitopes, whether both mutated and wildtype peptides were tested, and the associated outcomes.</p>
</sec>
<sec id="s2_5">
<title>Mapping Database Fields to Community-Supported Standards/Ontologies</title>
<p>In our planning and blueprint development for CEDAR, we have drawn on our experience operating the Immune Epitope Database (IEDB). Our extensive experience with the IEDB, which we initiated in 2003 and have been maintaining and enhancing over the past 18 years, has provided us with important lessons on what to do and, more importantly, what not to do when designing and maintaining an epitope database and analysis resource. By multiple metrics, the IEDB is a success, with &gt;4,000,000 experiments characterizing &gt;1,300,000 epitopes from &gt;22,000 references curated; a monthly rate of &gt;30,000 unique visitors, and &gt;3,900 citations per year (based on 2020 data). Importantly, even though the IEDB is currently not funded to respond to the needs of the cancer community, up to one-third of current IEDB users are applying its functionality in a cancer research setting. As part of our outreach activities, we have gathered requests from these users on how the IEDB could be improved for cancer researchers.</p>
<p>To accurately represent epitope information, the IEDB has developed a semantically well-defined data structure, which utilizes community-supported ontologies for most of its specific fields (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2</bold>
</xref>). The core of this data structure has proven to be remarkably flexible and robust, as it has been used to capture over 4 million assay records to date, enabling powerful aggregate queries on epitope information gathered in diverse settings. For example, for epitopes derived from viruses, the NCBI taxonomy is used to capture the particular virus that the epitope is known to originate from. This enables us to capture all synonymous names used to refer to that particular entity (&#x201c;Human Papillomavirus 16&#x201d; or &#x201c;HPV16&#x201d; or &#x201c;Human Papillomavirus type 16&#x201d;). It also allows storing and querying for information at different levels of granularity, such as obtaining all epitopes derived from viruses in the genus &#x201c;Alphapapillomavirus&#x201d; or specifying that an epitope was found in a particular isolate of HPV16. As other knowledge resources use the same NCBI taxonomic framework to represent organisms, it makes our data FAIR (findable, accessible, interoperable, and reusable) (<xref ref-type="bibr" rid="B25">25</xref>), which is particularly important for the (re-)use of IEDB data by the broader science community (<xref ref-type="bibr" rid="B26">26</xref>).</p>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>IEDB high-level structure and ontological backbone.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fimmu-12-735609-g002.tif"/>
</fig>
<p>We plan to follow the same paradigm in CEDAR and will ensure that each database field can be mapped to an accessible, community-supported ontology. For fields where the scope overlaps with the IEDB, the same standards can simply be re-used. For database fields that are specific to cancer, standards/ontologies will need to be identified to curate them accurately. We&#xa0;have already identified the need for additional cancer-specific disease terms, including disease states and stages. Disease states will continue to be described using Disease Ontology (DO) (<xref ref-type="bibr" rid="B27">27</xref>) terms, which will be expanded and refined to include all cancer terms. Additionally, all cancer-related disease terms will be grouped under the parent term &#x2018;neoplasm&#x2019;, which aligns with the classification of cancers in the National Cancer Institute Thesaurus (NCIT) (<xref ref-type="bibr" rid="B28">28</xref>). Similarly, the NCIT terms will be used to specify cancer stages and link these terms to their official NCIT definitions and identifiers. Our team is proficient in working with vocabulary providers and standardization efforts, and we will enthusiastically embrace recommendations and/or participate in efforts to develop data standards within the ITCR and general cancer research community.</p>
</sec>
<sec id="s2_6">
<title>Development and Implementation of a Web-Enabled Query and Reporting Interface</title>
<p>One of the challenges for biomedical community databases is to ensure that the query interfaces are intuitive and that the generated reports provide understandable and scientifically accurate results. An initial design for the CEDAR web query interface (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3</bold>
</xref>) focuses on making the most requested pieces of information immediately accessible. This query interface shares fields with those present in the IEDB for epitope structure, host, assays used to characterize the response, and MHC-restriction. At the same time, it enables the direct query for the source of the epitope as it is relevant to cancer, namely source antigen, neoplasm, immune response induction, and treatment. We anticipate adding antigen subtypes, a characterization of the neoplasm/tumor, the ability to select methods used to induce immune responses, and information on the treatment a host was undergoing. It will, for example, be possible to search for all epitopes in a given cancer type or epitopes associated with a specific mutation or gene of interest. The granular curation of the data and the flexible query structure of CEDAR will allow users, for example, to retrieve data related to either natural presentation, recognition of synthetic antigens, or both. More detailed searches will also be possible, such as searching for a specific type of assay or for instances where a specific type of treatment occurred.</p>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>Draft of cancer-specific query interface for CEDAR web portal. Highlighted in light blue are areas that include cancer-specific search parameters not present in the current IEDB interface.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fimmu-12-735609-g003.tif"/>
</fig>
</sec>
<sec id="s2_7">
<title>Background on the IEDB Curation Process</title>
<p>To identify and curate relevant publications that contain experimental cancer epitope data, CEDAR will utilize the validated curation approach established and optimized for the IEDB and modify specific steps where required. Over the last 18 years, we have developed, implemented, and continuously optimized the process to identify relevant journal articles for the IEDB and extract information from them, as outlined in <xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4</bold>
</xref>. Scientific literature is constantly monitored by querying the PubMed database on a biweekly basis with broad keyword queries, purposely designed to be comprehensive, in order to retrieve a broad universe of papers that should include all references describing immune epitopes. Over time, these specialized, broad queries have selected over 244,000 references from over 32 million papers available in PubMed.</p>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>Workflow for identifying curatable journal articles.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fimmu-12-735609-g004.tif"/>
</fig>
<p>Based on the abstract, automated text classifier tools and human experts then narrow these references down to those with likely relevance (<xref ref-type="bibr" rid="B29">29</xref>&#x2013;<xref ref-type="bibr" rid="B31">31</xref>). The criteria for passing this initial selection require that the reference is within the scope of the database, provides novel data (for example, review papers and use of epitopes as a mere marker or tag are excluded), and describes the epitope molecular structure in sufficient detail and granularity (reports of simple reactivity against whole proteins or undefined structures are excluded). Following these determinations, the reference is classified as &#x201c;relevant&#x201d;, and further subdivided into a specific disease category. The full text of relevant articles is then retrieved and assigned to a doctoral-level curator who extracts the data and enters it into the IEDB database curation system. The curated records are peer-reviewed, and once accepted, become visible to the public. The general curation processes are described in detail in previous publications (<xref ref-type="bibr" rid="B30">30</xref>, <xref ref-type="bibr" rid="B32">32</xref>&#x2013;<xref ref-type="bibr" rid="B34">34</xref>) and have been continuously adapted as new assay types are established, as has been done to capture receptor data from high throughput sequencing (<xref ref-type="bibr" rid="B35">35</xref>).</p>
</sec>
<sec id="s2_8">
<title>Development of a Prioritized Queue of Cancer-Related Articles for Curation</title>
<p>In preparation for cancer curation, papers that contain curatable epitope information as part of the IEDB curation workflow were further categorized by the use of automated text classifiers (<xref ref-type="bibr" rid="B29">29</xref>&#x2013;<xref ref-type="bibr" rid="B31">31</xref>, <xref ref-type="bibr" rid="B36">36</xref>) and manual inspection, into broad primary classes (Cancer, Infectious Diseases (excluding HIV which is curated by the Los Alamos database), Allergy, Autoimmunity, Transplantation and &#x201c;Other&#x201d;). The percentage of references classified in each of these broad categories is shown in <xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5</bold>
</xref>. Cancer references account for 10.6% of all identified and curatable epitope references. These references were further subdivided into a set of 20 subcategories, grouped as a function of similar antigens and/or cancer types. The most frequent category is melanoma antigens (MAA, 20%), reflecting the prominence of these antigen types in immunological investigations. Other frequent categories are carbohydrate antigens such as Lewis and related antigens (LEWIS, 3.3%), and popular antigens such as mucin (5.5%), Her2 and associated antigens (6.4%), MAGE and associated antigens (4.8%), prostate associated antigens (PROS, 4.0%), p53 (2.6%), antigens associated with lymphoid cancers (LEU, 5.6%), and CEA (2.1%). Neoepitope references were classified separately and presently account for only 5.0%; however, the number of papers in this category has been rapidly rising in recent years.</p>
<fig id="f5" position="float">
<label>Figure&#xa0;5</label>
<caption>
<p>Breakdown of classified and curatable references.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fimmu-12-735609-g005.tif"/>
</fig>
<p>In addition to this, we plan to inspect and broaden the initial PubMed query by adding keywords to ensure we capture all cancer epitope-specific articles. Our automated document classifier will be re-trained to specifically identify articles that contain cancer epitope-specific information, as we have done for other categories before. Different categories will be addressed in a sequential fashion. Our current first priority for curation includes neoepitopes and T cell epitopes associated with melanoma, breast, and prostate cancers, as these are among the most frequently studied in basic investigations and clinical trial settings.</p>
</sec>
<sec id="s2_9">
<title>Curating Previously Identified Relevant Cancer Articles With Immune Epitope Data</title>
<p>To begin curation of cancer epitope literature, curators will follow the curation rules encoded in the IEDB curation manual, a living document (<xref ref-type="bibr" rid="B37">37</xref>), which will be expanded and customized for CEDAR. In brief, for each epitope entered into the database, the structure of the epitope, i.e., an amino acid sequence for peptidic epitopes and a chemical structure for non-peptidic epitopes, is described. If the epitope is naturally occurring, the protein and organism from which the epitope was derived are also entered; for example, the human melanoma antigen recognized by T cells 1 (MART-1) protein. Additionally, all experimental assays in which the epitope was studied are added as T cell, B cell, or MHC ligand assays. The details of each assay include information such as the host, whose immune response was studied, the disease state and stage of the individual, the type of effector cells (CD8+ T cells) or antibodies (monoclonal IgG1) being studied, and the assay method (ELISA, flow cytometry, etc.) that was utilized. Curation also captures the sequences of the epitope-specific TCRs and BCRs.</p>
<p>Curators capture data by entering it into dynamic and interactive web forms designed to optimize productivity and to ensure accurate and consistent data entry. This curation interface enforces curation rules as the curator enters the data, which takes advantage of the ontology-based data structure on a per-field basis. Once the curator has completed entering the data, additional validation rules that cross-compare the content of different fields are checked by the system prior to allowing the curation to be submitted. Just as development will be required on front-end user interfaces to support cancer-specific query and reporting better, the back-end curation system will also require development to allow for appropriate data entry. This system will be updated in coordination with the query and reporting interface development described above and based on the outreach feedback described below.</p>
</sec>
<sec id="s2_10">
<title>Curated Cancer Epitope Datasets for Benchmarking Epitope Prediction Tools</title>
<p>The following sections describe the benchmarking, improvement and development of epitope prediction methods. The results of epitope predictions will lead to validation experiments determining which epitopes are actually of biological significance, which is arguably the ultimate goal. These results&#xa0;will, in a recursive modality, be fed back into training of epitope predictions, leading to increased prediction accuracy and significance.</p>
<p>Multiple computational tools and pipelines have been developed to predict cancer epitopes in the scientific community (<xref ref-type="bibr" rid="B38">38</xref>). The comprehensive sets of epitopes curated in CEDAR can be used to evaluate the performance of these tools. These benchmarking results will inform tool developers on the most valuable prediction approaches and tool users on which tools they can most rely on. Moreover, the epitope datasets created in this process will be valuable for the broader community in developing new tools. Since many of the tools evaluated will have been trained on subsets of existing data, &#x2018;live benchmarks&#x2019; will also be implemented, which consist of automated pipelines that run predictions on epitope datasets just before they are released in CEDAR. We have previously implemented such &#x2018;live-benchmarks&#x2019; for MHC class I (<xref ref-type="bibr" rid="B39">39</xref>) and MHC class II (<xref ref-type="bibr" rid="B40">40</xref>) binding predictions in the IEDB, and the framework established for these is easily expandable for CEDAR.</p>
<p>We previously performed a small benchmark on the predictability of cancer T cell epitopes with different prediction approaches (<xref ref-type="bibr" rid="B41">41</xref>). More comprehensive studies can be performed by taking advantage of the curation activities described above, which will already have translated the free text information from journal articles into a structured format. The granular curation in CEDAR will make it possible to distinguish different datasets, such as peptides shown to <italic>i)</italic> bind MHC, <italic>ii)</italic> be naturally processed and presented by MHC, <italic>iii)</italic> be recognized by T cells when provided as a synthetic antigen, and <italic>iv)</italic> be recognized by T cells as part of a tumor cell. Providing separate datasets for separate biological questions makes it easier for tool developers and users to communicate what a specific algorithm was trained and evaluated on.</p>
<p>We plan to extract these datasets focusing on high-quality experimental records and will make them accessible in formats that can be easily parsed with commonly utilized machine learning algorithms and data analysis packages. We plan to add columns containing additional factors that can help in the predictions. For example, based on the tumor type, the expression level of different source antigens can be estimated using National Cancer Institute (NCI) databases such as cBioPortal (<xref ref-type="bibr" rid="B19">19</xref>, <xref ref-type="bibr" rid="B42">42</xref>) and the GDC Data Portal (<xref ref-type="bibr" rid="B43">43</xref>), even if that expression data is not specifically measured in the original experiments.</p>
</sec>
<sec id="s2_11">
<title>Development of Novel Tools to Predict Cancer Epitopes</title>
<p>While most methods for predicting cancer T cell epitopes revolve around MHC binding prediction, which is a necessary step for an epitope to be recognized by T cells, other factors, such as the abundance of the epitope (or its precursors) in the tumor and the availability of a TCR repertoire capable of recognizing the epitope, influence T cell recognition. A thorough assessment of the importance of these different features is required, and CEDAR will provide independent datasets continuously acquired over time through the above-described curation process. Here we describe features that have been considered by multiple investigators as drivers of differential immune recognition (<xref ref-type="bibr" rid="B11">11</xref>, <xref ref-type="bibr" rid="B44">44</xref>&#x2013;<xref ref-type="bibr" rid="B49">49</xref>).</p>
<p>We and others have performed analyses correlating measures of the abundance of an MHC ligand with its likelihood to be recognized by T cells (<xref ref-type="bibr" rid="B11">11</xref>, <xref ref-type="bibr" rid="B46">46</xref>&#x2013;<xref ref-type="bibr" rid="B48">48</xref>, <xref ref-type="bibr" rid="B50">50</xref>). For cancer epitopes that arise from a mutation (neoepitopes), the abundance is expected to correlate with the frequency of the mutation in the tumor DNA, as well as with the RNA expression level. Our preliminary analysis of in-house data, as well as data recently published from the NCI (<xref ref-type="bibr" rid="B46">46</xref>), showed that the variant allele frequency in the RNA is significantly correlated with neoantigen recognition (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6</bold>
</xref>). Thus, including a measure of epitope abundance into machine learning methods is expected to improve cancer epitope prediction. Accordingly, for non-mutated cancer epitopes, the abundance of the associated source antigen, for example as measured by RNA-Seq or proteomic analysis, might improve epitope prediction and will be analyzed in detail.</p>
<fig id="f6" position="float">
<label>Figure&#xa0;6</label>
<caption>
<p>RNA correlation with neoantigen recognition.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fimmu-12-735609-g006.tif"/>
</fig>
<p>The TCR repertoire is shaped by both central and peripheral tolerance. Specifically, T cells with receptors binding to self-peptides are expected to undergo apoptosis or adopt a regulatory phenotype. Thus, we and others have hypothesized that peptides with high similarity to host peptides have a lower likelihood to be recognized by T cells (<xref ref-type="bibr" rid="B44">44</xref>, <xref ref-type="bibr" rid="B49">49</xref>, <xref ref-type="bibr" rid="B51">51</xref>, <xref ref-type="bibr" rid="B52">52</xref>). For cancer epitopes, the similarity to self-peptides is expected to be of particular relevance, given that - by definition - cancer epitopes are highly similar to host peptides. It will be important to develop metrics of peptide similarity that correlate best with peptide immunogenicity in a cancer epitope setting and determine if they improve the performance of epitope immunogenicity predictions (<xref ref-type="bibr" rid="B53">53</xref>). Furthermore, it has been hypothesized that, as TCRs have evolved to be cross-reactive for similar epitopes in order to provide protection from rapidly evolving pathogens (<xref ref-type="bibr" rid="B54">54</xref>, <xref ref-type="bibr" rid="B55">55</xref>), cancer epitopes with similarity to pathogen sequences may be more immunogenic, and this similarity may correlate with clinical outcome (<xref ref-type="bibr" rid="B56">56</xref>). It was also suggested that neoantigens from driver genes are more likely to be recognized by T cells (<xref ref-type="bibr" rid="B46">46</xref>).</p>
<p>As entries in CEDAR will be linked to specialized databases that host such information, we will be able to easily access all information and include it in the training of machine learning methods. The Cancer Genome Atlas (TCGA), the Catalogue Of Somatic Mutations In Cancer (COSMIC) (<xref ref-type="bibr" rid="B57">57</xref>), and the Cancer Gene Census (CGC) (<xref ref-type="bibr" rid="B57">57</xref>) are all examples of databases that can be utilized to retrieve information about recurrent cancer mutations and whether a mutation is affecting a driver gene or not. Newly generated sets of experimentally validated T cell epitopes that will become available in CEDAR will allow users to assess specific hypotheses, such as those mentioned above, and <italic>in silico</italic> prediction pipelines in general, that were created and tested on limited datasets.</p>
<p>Using the newly curated datasets from CEDAR, different combinations of features can be included in training machine learning methods to optimize the prediction of epitope recognition (<xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7</bold>
</xref>). The model can be trained to predict any cancer-epitope related outcome, such as cancer epitope recognition <italic>in vitro</italic> or <italic>in vivo</italic> activity (such as tumor regression or experimental model outcomes). With more epitope data becoming available, we will regularly update classifiers and assess whether the data contains additional features (including specificity to TCRs) that might be of relevance for predicting cancer epitopes. We estimate that the size of the training data set made available through the CEDAR curation of approximately 1,770 references will equal at least 50,000 epitopes, based on a comparison with the current epitope count in the IEDB. This data set should be sufficiently large to explore multiple training strategies and features for consideration.</p>
<fig id="f7" position="float">
<label>Figure&#xa0;7</label>
<caption>
<p>Schematic of an Artificial Neural Network we could implement to learn determinants of Cancer Epitope Recognition.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fimmu-12-735609-g007.tif"/>
</fig>
</sec>
<sec id="s2_12">
<title>Development of Cancer Epitope Analysis Tools</title>
<p>In our interactions with cancer immunologists and clinicians, it was pointed out that immunoinformatics tools to predict MHC binding and antigen-processing are not user-friendly, as they often require elaborate pre- and post-processing of input and output data to make them applicable in the cancer setting. We identified several recurrent operations involved in analyzing cancer epitopes, and we plan to create analysis tools that allow automation and integration into cancer epitope-specific pipelines.</p>
<p>Determining what neo-peptides are generated by a given mutation, for example, is non-trivial when complex mutations such as frameshifts or splicing variants are involved. We plan to provide tools to generate lists of overlapping n-mers to be included in experiments, given a mutation of interest (e.g., KRAS G12V or chr:12 341234 A&gt;T).</p>
<p>It is also of interest to identify if a given mutation or peptide has already been tested for immunogenicity, and if so, in what context. CEDAR will be interlinked with specialized databases such as TCGA, COSMIC, the CGC, and dbSNP, as mentioned above. We plan to develop tools to retrieve all available information for a given mutation, including if a given peptide has already been described in CEDAR (as a cancer epitope) or the IEDB (e.g., for pathogen-derived epitopes) and whether it is found elsewhere in the host proteome. Another important analysis tool will provide MHC binding predictions for a set of mutated and associated wildtype sequences in the context of a set of MHC alleles.</p>
<p>Likewise, it is of interest to determine if TCR or BCR sequences have been described before. For CEDAR, all published cancer-specific receptor sequences and their recognized cancer epitopes will be curated. This combined database will provide a comprehensive list of receptor sequences and the epitopes they recognize. We have developed a &#x2018;receptor lookup&#x2019; tool (<xref ref-type="bibr" rid="B58">58</xref>), which accepts the TCR &#x3b2; chain CDR3 sequence as an input, and identifies if TCRs with that exact sequence (or a highly similar one) have been previously characterized, and if so, what the previously identified epitope specificity is. This tool was designed to handle large input datasets, such as those generated by TCR repertoire sequencing experiments, and will annotate for each receptor if it has been found before and what epitopes it was previously reported to recognize in both cancer and other disease settings.</p>
</sec>
</sec>
<sec id="s3" sec-type="discussion">
<title>Discussion</title>
<p>Here we present our vision and &#x201c;blueprint&#x201d; to design and implement the Cancer Epitope Database and Analysis Resource (CEDAR), which will provide a comprehensive collection of cancer epitopes curated from the literature, as well as cancer epitope prediction and analysis tools. CEDAR will leverage our decades of experience from the development of the IEDB, which is fully operational and has been funded since 2003 through a contract from NIAID, with an extension to 2025. The IEDB focuses on allergy, infectious disease, transplantation, and autoimmunity but excludes cancer. Of note, the current <xref ref-type="fig" rid="f1">
<bold>Figures&#xa0;1</bold>
</xref>&#x2013;<xref ref-type="fig" rid="f3">
<bold>3</bold>
</xref> reflect the initial prototype based on the direct result of the input received in the initial planning stages by our panel of experts. We however expect that these will evolve over time as the prototypes are implemented and additional feedback is received.</p>
<p>It is now well recognized that understanding the nature of cancer epitopes and their cognate receptors enables us to answer important scientific questions. For example, researchers are examining how the mutation and epitope load in a given tumor relate to the success of checkpoint blockade treatments (<xref ref-type="bibr" rid="B4">4</xref>). In addition to this, current research explores epitope-based vaccines and the transfer of epitope-specific T cells and TCRs for use in personalized therapies (<xref ref-type="bibr" rid="B4">4</xref>, <xref ref-type="bibr" rid="B5">5</xref>, <xref ref-type="bibr" rid="B59">59</xref>, <xref ref-type="bibr" rid="B60">60</xref>). Epitopes recognized across different individuals provide ideal targets for more cost-effective, off-the-shelf immunotherapies, re-igniting interest in tumor-associated antigens. While mutation-based neoantigens have received considerable attention in recent years, the CEDAR initiative will also curate all data related to cancer-specific but non-mutated antigens, e.g. based on cancer-specific protein expression and processing variations, or cryptic antigens.</p>
<p>This interest is not limited to T cells, as several therapies also take advantage of defined antibodies and BCRs. Moreover, the ability to readily sequence TCRs and BCRs through single-cell sequencing studies of tumor tissues has provided an impetus to develop tools that facilitate the identification of tumor-specific T cells and B cells in these samples. To address these needs, CEDAR will provide a central, freely accessible catalog of cancer epitope and receptor data linked to the biological, immunological, and clinical contexts in which they were described. The ultimate goal is to come &#x201c;full circle&#x201d; and link epitope recognition and immunological readouts to outcomes of disease, treatment, and vaccination. We also aim to use these data to develop and evaluate machine learning-based epitope and TCR/BCR specificity prediction tools for the analysis resource component of CEDAR.</p>
<p>The CEDAR website will initially be developed based on our experience in translational cancer research, as well as feedback obtained from a diverse set of cancer experts. The website will enable intuitive and scientifically accurate cancer-specific queries and reports. This will be implemented by leveraging the existing IEDB database, curation, and query and reporting infrastructure, and expanding it to represent clinical and disease phenotypes beyond what is currently in the IEDB. Additional fields relevant to cancer will be accurately captured, such as different forms and histologies of cancer and associated immunological, biological, and clinical information. Based on our preliminary data, the modifications required in the IEDB infrastructure to enable CEDAR can be implemented in a period of 12 months. Once established, subsequent modifications to CEDAR will be driven by broader community feedback.</p>
<p>Curation of immune epitope data from literature, relevant to cancer immunology, will include B and T cell epitopes associated with cancer antigens, and in particular, naturally processed and presented epitopes recognized in the context of a tumor, such as the ones recognized by tumor-infiltrating lymphocytes. Epitope data gathered in immunotherapy studies, in human clinical trials and animal models, will also be captured along with the sequences of both naturally occurring and engineered cancer epitope-specific TCRs and BCRs.</p>
<p>Data related to cancer-specific HLA ligandomics analysis by mass spectrometry will also be prominently curated and displayed, as well as data demonstrating epitopes&#x2019; natural presentation on tumor cells. Currently, natural ligand data is already curated in the IEDB, and more than 872,001 eluted ligands are curated and accessible through the IEDB website. These data together with any cancer-specific data will be accessible through both the IEDB and CEDAR webpages.</p>
<p>The granular curation of the data and the flexible query structure of CEDAR will allow the user to extract the data most relevant for different queries. For example, data related to natural presentation or recognition of tumor targets is arguably the most important whenever available, whereas recognition of synthetic antigens by T cells has frequently led to false positive results. The flexible query structure of CEDAR will allow users to retrieve data related to either natural presentation, recognition of synthetic antigens, or both.</p>
<p>CEDAR will curate all cancer epitope data obtained either <italic>in vivo</italic> or <italic>in vitro</italic>. Tumor rejection or tumor control data is one of the measures of activity of cancer epitopes and will be curated as such where available. Indeed, several studies have published data in mouse models and human clinical trials where the ability of individual cancer epitopes has been tested <italic>in vivo</italic> (<xref ref-type="bibr" rid="B61">61</xref>&#x2013;<xref ref-type="bibr" rid="B65">65</xref>). Arguably, this is the most significant activity of a cancer epitope. A number of studies also previously reported T cell responses against cancer epitopes <italic>in vitro</italic>, which however did not result in clinical activity when tested <italic>in vivo</italic> (<xref ref-type="bibr" rid="B66">66</xref>&#x2013;<xref ref-type="bibr" rid="B68">68</xref>). Furthermore, human studies (<xref ref-type="bibr" rid="B69">69</xref>, <xref ref-type="bibr" rid="B70">70</xref>) and mouse studies (<xref ref-type="bibr" rid="B71">71</xref>, <xref ref-type="bibr" rid="B72">72</xref>) have highlighted contradictions in the data on neoepitope recognition. As CEDAR will include data from both <italic>in vitro</italic> and <italic>in vivo</italic> experiments, it will be possible to analyze any correlations between T and B cell responses <italic>in vitro</italic> and associated antitumor efficacy <italic>in vivo.</italic>
</p>
<p>To the best of our knowledge, CEDAR would provide the first comprehensive and curated cancer epitope database in which the biological, immunological, and clinical context is captured with high granularity and is retrievable for analysis with ease and accuracy. Currently, none of the available repositories capture comprehensive cancer epitope information with the necessary granularity. CEDAR will provide query and reporting strategies specifically designed to meet the needs of cancer researchers to make cancer epitope data and metadata accessible. These strategies are designed specifically for CEDAR and will be developed in a timely and cost-effective manner, relying on the existing IEDB infrastructure, which is based on over 18 years of work experience and development.</p>
<p>Large efforts have been dedicated to developing novel approaches for improved prediction and/or identification of cancer neoepitopes (<xref ref-type="bibr" rid="B1">1</xref>, <xref ref-type="bibr" rid="B41">41</xref>, <xref ref-type="bibr" rid="B52">52</xref>, <xref ref-type="bibr" rid="B56">56</xref>, <xref ref-type="bibr" rid="B73">73</xref>&#x2013;<xref ref-type="bibr" rid="B77">77</xref>). Each of these efforts proposed different features to complement HLA binding prediction to improve the ability to identify cancer neoepitopes. However, these studies are highly heterogeneous in terms of data generation, validation techniques, and the generality of the obtained conclusions, further challenged by an often very limited sample size. The Tumor Neoantigen Selection Alliance (TESLA) has provided an attempt to address these issues by generating uniform data sets to be used by the community for prediction of neoepitope candidates with subsequent experimental validation (<xref ref-type="bibr" rid="B49">49</xref>). The main conclusion from this work was that immunogenic tumor epitopes &#x2018;are those tumor peptides that have strong MHC binding affinity and long half-life, are expressed highly and have either low agretopicity or high foreignness&#x2019; (<xref ref-type="bibr" rid="B49">49</xref>).</p>
<p>CEDAR will further this kind of analysis and provide a validated set of cancer epitope prediction and analysis tools. Users will have access to implementations for published tools that currently have no web-accessible versions, and objective and transparent benchmarks of all tools will be performed using literature data that becomes available in CEDAR through ongoing curation efforts. In line with what has been the case for general T cell epitope prediction tools, the availability of comprehensive datasets within the IEDB and benchmarking has been pivotal for the identification of well-performing tools, excluding anecdotal results. Similarly, we expect that these properties of CEDAR will allow users to identify non-dataset-specific properties and help move the field of cancer neoepitope prediction forward. Finally, new tools will be developed based&#xa0;on&#xa0;lessons learned from the benchmarks that include cancer-specific considerations, such as gene expression. Additionally, we aim to provide a tool that will compare the mutant and wildtype sequences in terms of their ability to bind cognate HLA molecules and trigger T cell responses when evaluating immunogenicity.</p>
<p>We will greatly expand the development, hosting, and availability of different strategies to predict the immunogenicity and clinical efficacy of cancer epitopes, as well as their potential as a surrogate marker of positive clinical evolution following cancer treatments. The availability of large, curated cancer epitope datasets, reference implementations of prediction approaches, and clear metrics of success is necessary to inform both the community of tool developers on what makes a tool useful and the community of tool users on which tool to use for their application. Users will be provided with unbiased, objective, and transparent evaluations of different epitope prediction tools side-by-side, with the code being made publicly available. Cross-comparison of prediction approaches on epitope datasets derived from cancer <italic>versus</italic> other diseases (infection, allergy, autoimmunity) will determine if there are predictable features of cancer epitopes that differentiate them from other epitopes.</p>
<p>As the CEDAR data will be hosted side-by-side with IEDB data, the resulting combined dataset will encompass all known epitopes and their TCRs and BCRs, regardless of disease context. This dataset will enable highly innovative analyses, namely the ability to identify TCR and BCR sequences with known (or inferred) epitope specificity from repertoire sequencing data. With the increasing ease of isolating and sequencing TCRs, the identified repertoire can be compared to the continuously growing database of known TCR:epitope:MHC interactions. This will allow identification of TCRs in tumor-associated T cells targeting known neoepitopes or tumor-associated antigens, as well as TCRs targeting viral epitopes (<xref ref-type="bibr" rid="B60">60</xref>, <xref ref-type="bibr" rid="B78">78</xref>, <xref ref-type="bibr" rid="B79">79</xref>). Some studies have reported enrichment of TCRs that recognize viral epitopes in TIL that could be cross-reactive, as well as TCRs capable of recognizing unmutated self-peptides expressed in normal tissue (<xref ref-type="bibr" rid="B80">80</xref>, <xref ref-type="bibr" rid="B81">81</xref>), which could result in autoimmune side-effects of checkpoint blockade treatments. Ultimately, CEDAR will prove to be a powerful resource for the cancer community and will help advance cancer research and the development of effective cancer therapies.</p>
</sec>
<sec id="s4" sec-type="data-availability">
<title>Data Availability Statement</title>
<p>The original contributions presented in the study are included in the article/supplementary material. Further inquiries can be directed to the corresponding author.</p>
</sec>
<sec id="s5">
<title>Author Contributions</title>
<p>ZK-Y, NB, AS, and BP prepared the manuscript. HC, MN, EZ, DK, JC-G, PR, and SPS reviewed and edited the manuscript. All authors contributed to the article and approved the submitted version.</p>
</sec>
<sec id="s6" sec-type="funding-information">
<title>Funding</title>
<p>Research reported in this publication was supported by the National Cancer Institute of the National Institutes of Health under award numbers U24CA248138 and U01DE028227.</p>
</sec>
<sec id="s7">
<title>Author Disclaimer</title>
<p>The content is solely the responsibility of the authors and does not necessarily represent the official views of the National Institutes of Health.</p>
</sec>
<sec id="s8" sec-type="COI-statement">
<title>Conflict of Interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s9" sec-type="disclaimer">
<title>Publisher&#x2019;s Note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
</body>
<back>
<ref-list>
<title>References</title>
<ref id="B1">
<label>1</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Abelin</surname> <given-names>JG</given-names>
</name>
<name>
<surname>Keskin</surname> <given-names>DB</given-names>
</name>
<name>
<surname>Sarkizova</surname> <given-names>S</given-names>
</name>
<name>
<surname>Hartigan</surname> <given-names>CR</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>W</given-names>
</name>
<name>
<surname>Sidney</surname> <given-names>J</given-names>
</name>
<etal/>
</person-group>. <article-title>Mass Spectrometry Profiling of HLA-Associated Peptidomes in Mono-Allelic Cells Enables More Accurate Epitope Prediction</article-title>. <source>Immunity</source> (<year>2017</year>) <volume>46</volume>:<page-range>315&#x2013;26</page-range>. doi: <pub-id pub-id-type="doi">10.1016/j.immuni.2017.02.007</pub-id>
</citation>
</ref>
<ref id="B2">
<label>2</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zamora</surname> <given-names>AE</given-names>
</name>
<name>
<surname>Crawford</surname> <given-names>JC</given-names>
</name>
<name>
<surname>Thomas</surname> <given-names>PG</given-names>
</name>
</person-group>. <article-title>Hitting the Target: How T Cells Detect and Eliminate Tumors</article-title>. <source>J Immunol</source> (<year>2018</year>) <volume>200</volume>:<page-range>392&#x2013;9</page-range>. doi: <pub-id pub-id-type="doi">10.4049/jimmunol.1701413</pub-id>
</citation>
</ref>
<ref id="B3">
<label>3</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Topalian</surname> <given-names>SL</given-names>
</name>
<name>
<surname>Drake</surname> <given-names>CG</given-names>
</name>
<name>
<surname>Pardoll</surname> <given-names>DM</given-names>
</name>
</person-group>. <article-title>Immune Checkpoint Blockade: A Common Denominator Approach to Cancer Therapy</article-title>. <source>Cancer Cell</source> (<year>2015</year>) <volume>27</volume>:<page-range>450&#x2013;61</page-range>. doi: <pub-id pub-id-type="doi">10.1016/j.ccell.2015.03.001</pub-id>
</citation>
</ref>
<ref id="B4">
<label>4</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Schumacher</surname> <given-names>TN</given-names>
</name>
<name>
<surname>Scheper</surname> <given-names>W</given-names>
</name>
<name>
<surname>Kvistborg</surname> <given-names>P</given-names>
</name>
</person-group>. <article-title>Cancer Neoantigens</article-title>. <source>Annu Rev Immunol</source> (<year>2019</year>) <volume>37</volume>:<fpage>173</fpage>&#x2013;<lpage>200</lpage>. doi: <pub-id pub-id-type="doi">10.1146/annurev-immunol-042617-053402</pub-id>
</citation>
</ref>
<ref id="B5">
<label>5</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Curran</surname> <given-names>MA</given-names>
</name>
<name>
<surname>Glisson</surname> <given-names>BS</given-names>
</name>
</person-group>. <article-title>New Hope for Therapeutic Cancer Vaccines in the Era of Immune Checkpoint Modulation</article-title>. <source>Annu Rev Med</source> (<year>2019</year>) <volume>70</volume>:<page-range>409&#x2013;24</page-range>. doi: <pub-id pub-id-type="doi">10.1146/annurev-med-050217-121900</pub-id>
</citation>
</ref>
<ref id="B6">
<label>6</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Topalian</surname> <given-names>SL</given-names>
</name>
<name>
<surname>Taube</surname> <given-names>JM</given-names>
</name>
<name>
<surname>Pardoll</surname> <given-names>DM</given-names>
</name>
</person-group>. <article-title>Neoadjuvant Checkpoint Blockade for Cancer Immunotherapy</article-title>. <source>Science</source> (<year>2020</year>) <volume>367</volume>(<issue>6477</issue>):<page-range>eaax0182</page-range>. doi: <pub-id pub-id-type="doi">10.1126/science.aax0182</pub-id>
</citation>
</ref>
<ref id="B7">
<label>7</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>G</given-names>
</name>
<name>
<surname>Chitkushev</surname> <given-names>L</given-names>
</name>
<name>
<surname>Olsen</surname> <given-names>LR</given-names>
</name>
<name>
<surname>Keskin</surname> <given-names>DB</given-names>
</name>
<name>
<surname>Brusic</surname> <given-names>V</given-names>
</name>
</person-group>. <article-title>TANTIGEN 2.0: A Knowledge Base of Tumor T Cell Antigens and Epitopes</article-title>. <source>BMC Bioinf</source> (<year>2021</year>) <volume>22</volume>:<fpage>40</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s12859-021-03962-7</pub-id>
</citation>
</ref>
<ref id="B8">
<label>8</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xia</surname> <given-names>J</given-names>
</name>
<name>
<surname>Bai</surname> <given-names>P</given-names>
</name>
<name>
<surname>Fan</surname> <given-names>W</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Q</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>D</given-names>
</name>
<etal/>
</person-group>. <article-title>NEPdb: A Database of T-Cell Experimentally-Validated Neoantigens and Pan-Cancer Predicted Neoepitopes for Cancer Immunotherapy</article-title>. <source>Front Immunol</source> (<year>2021</year>) <volume>12</volume>:<elocation-id>644637</elocation-id>. doi: <pub-id pub-id-type="doi">10.3389/fimmu.2021.644637</pub-id>
</citation>
</ref>
<ref id="B9">
<label>9</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tan</surname> <given-names>X</given-names>
</name>
<name>
<surname>Li</surname> <given-names>D</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>P</given-names>
</name>
<name>
<surname>Jian</surname> <given-names>X</given-names>
</name>
<name>
<surname>Wan</surname> <given-names>H</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>G</given-names>
</name>
<etal/>
</person-group>. <article-title>dbPepNeo: A Manually Curated Database for Human Tumor Neoantigen Peptides</article-title>. <source>Database (Oxford)</source> (<year>2020</year>) <volume>2020</volume>:<fpage>1</fpage>&#x2013;<lpage>8</lpage>. doi: <pub-id pub-id-type="doi">10.1093/database/baaa004</pub-id>
</citation>
</ref>
<ref id="B10">
<label>10</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Vita</surname> <given-names>R</given-names>
</name>
<name>
<surname>Mahajan</surname> <given-names>S</given-names>
</name>
<name>
<surname>Overton</surname> <given-names>JA</given-names>
</name>
<name>
<surname>Dhanda</surname> <given-names>SK</given-names>
</name>
<name>
<surname>Martini</surname> <given-names>S</given-names>
</name>
<name>
<surname>Cantrell</surname> <given-names>JR</given-names>
</name>
<etal/>
</person-group>. <article-title>The Immune Epitope Database (IEDB): 2018 Update</article-title>. <source>Nucleic Acids Res</source> (<year>2019</year>) <volume>47</volume>:<page-range>D339&#x2013;43</page-range>. doi: <pub-id pub-id-type="doi">10.1093/nar/gky1006</pub-id>
</citation>
</ref>
<ref id="B11">
<label>11</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gartner</surname> <given-names>JJ</given-names>
</name>
<name>
<surname>Parkhurst</surname> <given-names>MR</given-names>
</name>
<name>
<surname>Gros</surname> <given-names>A</given-names>
</name>
<name>
<surname>Tran</surname> <given-names>E</given-names>
</name>
<name>
<surname>Jafferji</surname> <given-names>MS</given-names>
</name>
<name>
<surname>Copeland</surname> <given-names>A</given-names>
</name>
<etal/>
</person-group>. <article-title>A Machine Learning Model for Ranking Candidate HLA Class I Neoantigens Based on Known Neoepitopes From Multiple Human Tumor Types</article-title>. <source>Nat Cancer</source> (<year>2021</year>) <volume>2</volume>:<fpage>1</fpage>&#x2013;<lpage>12</lpage>. doi: <pub-id pub-id-type="doi">10.1038/s43018-021-00197-6</pub-id>
</citation>
</ref>
<ref id="B12">
<label>12</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hastings</surname> <given-names>J</given-names>
</name>
<name>
<surname>Owen</surname> <given-names>G</given-names>
</name>
<name>
<surname>Dekker</surname> <given-names>A</given-names>
</name>
<name>
<surname>Ennis</surname> <given-names>M</given-names>
</name>
<name>
<surname>Kale</surname> <given-names>N</given-names>
</name>
<name>
<surname>Muthukrishnan</surname> <given-names>V</given-names>
</name>
<etal/>
</person-group>. <article-title>ChEBI in 2016: Improved Services and an Expanding Collection of Metabolites</article-title>. <source>Nucleic Acids Res</source> (<year>2016</year>) <volume>44</volume>:<page-range>D1214&#x2013;9</page-range>. doi: <pub-id pub-id-type="doi">10.1093/nar/gkv1031</pub-id>
</citation>
</ref>
<ref id="B13">
<label>13</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kim</surname> <given-names>S</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>J</given-names>
</name>
<name>
<surname>Cheng</surname> <given-names>T</given-names>
</name>
<name>
<surname>Gindulyte</surname> <given-names>A</given-names>
</name>
<name>
<surname>He</surname> <given-names>J</given-names>
</name>
<name>
<surname>He</surname> <given-names>S</given-names>
</name>
<etal/>
</person-group>. <article-title>PubChem 2019 Update: Improved Access to Chemical Data</article-title>. <source>Nucleic Acids Res</source> (<year>2019</year>) <volume>47</volume>:<page-range>D1102&#x2013;9</page-range>. doi: <pub-id pub-id-type="doi">10.1093/nar/gky1033</pub-id>
</citation>
</ref>
<ref id="B14">
<label>14</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Smith</surname> <given-names>CC</given-names>
</name>
<name>
<surname>Selitsky</surname> <given-names>SR</given-names>
</name>
<name>
<surname>Chai</surname> <given-names>S</given-names>
</name>
<name>
<surname>Armistead</surname> <given-names>PM</given-names>
</name>
<name>
<surname>Vincent</surname> <given-names>BG</given-names>
</name>
<name>
<surname>Serody</surname> <given-names>JS</given-names>
</name>
</person-group>. <article-title>Alternative Tumour-Specific Antigens</article-title>. <source>Nat Rev Cancer</source> (<year>2019</year>) <volume>19</volume>:<page-range>465&#x2013;78</page-range>. doi: <pub-id pub-id-type="doi">10.1038/s41568-019-0162-4</pub-id>
</citation>
</ref>
<ref id="B15">
<label>15</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Uhlen</surname> <given-names>M</given-names>
</name>
<name>
<surname>Fagerberg</surname> <given-names>L</given-names>
</name>
<name>
<surname>Hallstrom</surname> <given-names>BM</given-names>
</name>
<name>
<surname>Lindskog</surname> <given-names>C</given-names>
</name>
<name>
<surname>Oksvold</surname> <given-names>P</given-names>
</name>
<name>
<surname>Mardinoglu</surname> <given-names>A</given-names>
</name>
<etal/>
</person-group>. <article-title>Proteomics. Tissue-Based Map of the Human Proteome</article-title>. <source>Science</source> (<year>2015</year>) <volume>347</volume>:<fpage>1260419</fpage>. doi: <pub-id pub-id-type="doi">10.1126/science.1260419</pub-id>
</citation>
</ref>
<ref id="B16">
<label>16</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<collab>The Gene Ontology Consortium</collab>
</person-group>. <article-title>The Gene Ontology Resource: 20 Years and Still GOing Strong</article-title>. <source>Nucleic Acids Res</source> (<year>2019</year>) <volume>47</volume>:<page-range>D330&#x2013;8</page-range>. doi: <pub-id pub-id-type="doi">10.1093/nar/gky1055</pub-id>
</citation>
</ref>
<ref id="B17">
<label>17</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ashburner</surname> <given-names>M</given-names>
</name>
<name>
<surname>Ball</surname> <given-names>CA</given-names>
</name>
<name>
<surname>Blake</surname> <given-names>JA</given-names>
</name>
<name>
<surname>Botstein</surname> <given-names>D</given-names>
</name>
<name>
<surname>Butler</surname> <given-names>H</given-names>
</name>
<name>
<surname>Cherry</surname> <given-names>JM</given-names>
</name>
<etal/>
</person-group>. <article-title>Gene Ontology: Tool for the Unification of Biology. The Gene Ontology Consortium</article-title>. <source>Nat Genet</source> (<year>2000</year>) <volume>25</volume>:<page-range>25&#x2013;9</page-range>. doi: <pub-id pub-id-type="doi">10.1038/75556</pub-id>
</citation>
</ref>
<ref id="B18">
<label>18</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<collab>Cancer Genome Atlas Research Network</collab>
<name>
<surname>Weinstein</surname> <given-names>JN</given-names>
</name>
<name>
<surname>Collisson</surname> <given-names>EA</given-names>
</name>
<name>
<surname>Mills</surname> <given-names>GB</given-names>
</name>
<name>
<surname>Shaw</surname> <given-names>KR</given-names>
</name>
<name>
<surname>Ozenberger</surname> <given-names>BA</given-names>
</name>
<etal/>
</person-group>. <article-title>The Cancer Genome Atlas Pan-Cancer Analysis Project</article-title>. <source>Nat Genet</source> (<year>2013</year>) <volume>45</volume>:<page-range>1113&#x2013;20</page-range>. doi: <pub-id pub-id-type="doi">10.1038/ng.2764</pub-id>
</citation>
</ref>
<ref id="B19">
<label>19</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cerami</surname> <given-names>E</given-names>
</name>
<name>
<surname>Gao</surname> <given-names>J</given-names>
</name>
<name>
<surname>Dogrusoz</surname> <given-names>U</given-names>
</name>
<name>
<surname>Gross</surname> <given-names>BE</given-names>
</name>
<name>
<surname>Sumer</surname> <given-names>SO</given-names>
</name>
<name>
<surname>Aksoy</surname> <given-names>BA</given-names>
</name>
<etal/>
</person-group>. <article-title>The cBio Cancer Genomics Portal: An Open Platform for Exploring Multidimensional Cancer Genomics Data</article-title>. <source>Cancer Discov</source> (<year>2012</year>) <volume>2</volume>:<page-range>401&#x2013;4</page-range>. doi: <pub-id pub-id-type="doi">10.1158/2159-8290.CD-12-0095</pub-id>
</citation>
</ref>
<ref id="B20">
<label>20</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ghandi</surname> <given-names>M</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>FW</given-names>
</name>
<name>
<surname>Jane-Valbuena</surname> <given-names>J</given-names>
</name>
<name>
<surname>Kryukov</surname> <given-names>GV</given-names>
</name>
<name>
<surname>Lo</surname> <given-names>CC</given-names>
</name>
<name>
<surname>McDonald</surname> <given-names>ER</given-names>
<suffix>3rd</suffix>
</name>
<etal/>
</person-group>. <article-title>Next-Generation Characterization of the Cancer Cell Line Encyclopedia</article-title>. <source>Nature</source> (<year>2019</year>) <volume>569</volume>:<page-range>503&#x2013;8</page-range>. doi: <pub-id pub-id-type="doi">10.1038/s41586-019-1186-3</pub-id>
</citation>
</ref>
<ref id="B21">
<label>21</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Reva</surname> <given-names>B</given-names>
</name>
<name>
<surname>Antipin</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Sander</surname> <given-names>C</given-names>
</name>
</person-group>. <article-title>Predicting the Functional Impact of Protein Mutations: Application to Cancer Genomics</article-title>. <source>Nucleic Acids Res</source> (<year>2011</year>) <volume>39</volume>:<fpage>e118</fpage>. doi: <pub-id pub-id-type="doi">10.1093/nar/gkr407</pub-id>
</citation>
</ref>
<ref id="B22">
<label>22</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tokheim</surname> <given-names>C</given-names>
</name>
<name>
<surname>Karchin</surname> <given-names>R</given-names>
</name>
</person-group>. <article-title>CHASMplus Reveals the Scope of Somatic Missense Mutations Driving Human Cancers</article-title>. <source>Cell Syst</source> (<year>2019</year>) <volume>9</volume>:<fpage>9</fpage>&#x2013;<lpage>23.e8</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.cels.2019.05.005</pub-id>
</citation>
</ref>
<ref id="B23">
<label>23</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Klausen</surname> <given-names>MS</given-names>
</name>
<name>
<surname>Jespersen</surname> <given-names>MC</given-names>
</name>
<name>
<surname>Nielsen</surname> <given-names>H</given-names>
</name>
<name>
<surname>Jensen</surname> <given-names>KK</given-names>
</name>
<name>
<surname>Jurtz</surname> <given-names>VI</given-names>
</name>
<name>
<surname>Sonderby</surname> <given-names>CK</given-names>
</name>
<etal/>
</person-group>. <article-title>NetSurfP-2.0: Improved Prediction of Protein Structural Features by Integrated Deep Learning</article-title>. <source>Proteins</source> (<year>2019</year>) <volume>87</volume>:<page-range>520&#x2013;7</page-range>. doi: <pub-id pub-id-type="doi">10.1002/prot.25674</pub-id>
</citation>
</ref>
<ref id="B24">
<label>24</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sigrist</surname> <given-names>CJ</given-names>
</name>
<name>
<surname>de Castro</surname> <given-names>E</given-names>
</name>
<name>
<surname>Cerutti</surname> <given-names>L</given-names>
</name>
<name>
<surname>Cuche</surname> <given-names>BA</given-names>
</name>
<name>
<surname>Hulo</surname> <given-names>N</given-names>
</name>
<name>
<surname>Bridge</surname> <given-names>A</given-names>
</name>
<etal/>
</person-group>. <article-title>New and Continuing Developments at PROSITE</article-title>. <source>Nucleic Acids Res</source> (<year>2013</year>) <volume>41</volume>:<page-range>D344&#x2013;7</page-range>. doi: <pub-id pub-id-type="doi">10.1093/nar/gks1067</pub-id>
</citation>
</ref>
<ref id="B25">
<label>25</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wilkinson</surname> <given-names>MD</given-names>
</name>
<name>
<surname>Dumontier</surname> <given-names>M</given-names>
</name>
<name>
<surname>Aalbersberg</surname> <given-names>IJ</given-names>
</name>
<name>
<surname>Appleton</surname> <given-names>G</given-names>
</name>
<name>
<surname>Axton</surname> <given-names>M</given-names>
</name>
<name>
<surname>Baak</surname> <given-names>A</given-names>
</name>
<etal/>
</person-group>. <article-title>The FAIR Guiding Principles for Scientific Data Management and Stewardship</article-title>. <source>Sci Data</source> (<year>2016</year>) <volume>3</volume>:<fpage>160018</fpage>. doi: <pub-id pub-id-type="doi">10.1038/sdata.2016.18</pub-id>
</citation>
</ref>
<ref id="B26">
<label>26</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Vita</surname> <given-names>R</given-names>
</name>
<name>
<surname>Overton</surname> <given-names>JA</given-names>
</name>
<name>
<surname>Mungall</surname> <given-names>CJ</given-names>
</name>
<name>
<surname>Sette</surname> <given-names>A</given-names>
</name>
<name>
<surname>Peters</surname> <given-names>B</given-names>
</name>
</person-group>. <article-title>FAIR Principles and the IEDB: Short-Term Improvements and a Long-Term Vision of OBO-Foundry Mediated Machine-Actionable Interoperability</article-title>. <source>Database (Oxford)</source> (<year>2018</year>) <volume>2018</volume>. doi: <pub-id pub-id-type="doi">10.1093/database/bax105</pub-id>
</citation>
</ref>
<ref id="B27">
<label>27</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Schriml</surname> <given-names>LM</given-names>
</name>
<name>
<surname>Mitraka</surname> <given-names>E</given-names>
</name>
<name>
<surname>Munro</surname> <given-names>J</given-names>
</name>
<name>
<surname>Tauber</surname> <given-names>B</given-names>
</name>
<name>
<surname>Schor</surname> <given-names>M</given-names>
</name>
<name>
<surname>Nickle</surname> <given-names>L</given-names>
</name>
<etal/>
</person-group>. <article-title>Human Disease Ontology 2018 Update: Classification, Content and Workflow Expansion</article-title>. <source>Nucleic Acids Res</source> (<year>2019</year>) <volume>47</volume>:<page-range>D955&#x2013;62</page-range>. doi: <pub-id pub-id-type="doi">10.1093/nar/gky1032</pub-id>
</citation>
</ref>
<ref id="B28">
<label>28</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fragoso</surname> <given-names>G</given-names>
</name>
<name>
<surname>de Coronado</surname> <given-names>S</given-names>
</name>
<name>
<surname>Haber</surname> <given-names>M</given-names>
</name>
<name>
<surname>Hartel</surname> <given-names>F</given-names>
</name>
<name>
<surname>Wright</surname> <given-names>L</given-names>
</name>
</person-group>. <article-title>Overview and Utilization of the NCI Thesaurus</article-title>. <source>Comp Funct Genomics</source> (<year>2004</year>) <volume>5</volume>:<page-range>648&#x2013;54</page-range>. doi: <pub-id pub-id-type="doi">10.1002/cfg.445</pub-id>
</citation>
</ref>
<ref id="B29">
<label>29</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>P</given-names>
</name>
<name>
<surname>Morgan</surname> <given-names>AA</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>Q</given-names>
</name>
<name>
<surname>Sette</surname> <given-names>A</given-names>
</name>
<name>
<surname>Peters</surname> <given-names>B</given-names>
</name>
</person-group>. <article-title>Automating Document Classification for the Immune Epitope Database</article-title>. <source>BMC Bioinf</source> (<year>2007</year>) <volume>8</volume>:<fpage>269</fpage>. doi: <pub-id pub-id-type="doi">10.1186/1471-2105-8-269</pub-id>
</citation>
</ref>
<ref id="B30">
<label>30</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Vita</surname> <given-names>R</given-names>
</name>
<name>
<surname>Peters</surname> <given-names>B</given-names>
</name>
<name>
<surname>Sette</surname> <given-names>A</given-names>
</name>
</person-group>. <article-title>The Curation Guidelines of the Immune Epitope Database and Analysis Resource</article-title>. <source>Cytometry A</source> (<year>2008</year>) <volume>73</volume>:<page-range>1066&#x2013;70</page-range>. doi: <pub-id pub-id-type="doi">10.1002/cyto.a.20585</pub-id>
</citation>
</ref>
<ref id="B31">
<label>31</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Davies</surname> <given-names>V</given-names>
</name>
<name>
<surname>Vaughan</surname> <given-names>K</given-names>
</name>
<name>
<surname>Damle</surname> <given-names>R</given-names>
</name>
<name>
<surname>Peters</surname> <given-names>B</given-names>
</name>
<name>
<surname>Sette</surname> <given-names>A</given-names>
</name>
</person-group>. <article-title>Classification of the Universe of Immune Epitope Literature: Representation and Knowledge Gaps</article-title>. <source>PLoS One</source> (<year>2009</year>) <volume>4</volume>:<fpage>e6948</fpage>. doi: <pub-id pub-id-type="doi">10.1371/journal.pone.0006948</pub-id>
</citation>
</ref>
<ref id="B32">
<label>32</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Vita</surname> <given-names>R</given-names>
</name>
<name>
<surname>Vaughan</surname> <given-names>K</given-names>
</name>
<name>
<surname>Zarebski</surname> <given-names>L</given-names>
</name>
<name>
<surname>Salimi</surname> <given-names>N</given-names>
</name>
<name>
<surname>Fleri</surname> <given-names>W</given-names>
</name>
<name>
<surname>Grey</surname> <given-names>H</given-names>
</name>
<etal/>
</person-group>. <article-title>Curation of Complex, Context-Dependent Immunological Data</article-title>. <source>BMC Bioinf</source> (<year>2006</year>) <volume>7</volume>:<fpage>341</fpage>. doi: <pub-id pub-id-type="doi">10.1186/1471-2105-7-341</pub-id>
</citation>
</ref>
<ref id="B33">
<label>33</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Salimi</surname> <given-names>N</given-names>
</name>
<name>
<surname>Vita</surname> <given-names>R</given-names>
</name>
</person-group>. <article-title>The Biocurator: Connecting and Enhancing Scientific Data</article-title>. <source>PLoS Comput Biol</source> (<year>2006</year>) <volume>2</volume>:<fpage>e125</fpage>. doi: <pub-id pub-id-type="doi">10.1371/journal.pcbi.0020125</pub-id>
</citation>
</ref>
<ref id="B34">
<label>34</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fleri</surname> <given-names>W</given-names>
</name>
<name>
<surname>Vaughan</surname> <given-names>K</given-names>
</name>
<name>
<surname>Salimi</surname> <given-names>N</given-names>
</name>
<name>
<surname>Vita</surname> <given-names>R</given-names>
</name>
<name>
<surname>Peters</surname> <given-names>B</given-names>
</name>
<name>
<surname>Sette</surname> <given-names>A</given-names>
</name>
</person-group>. <article-title>The Immune Epitope Database: How Data Are Entered and Retrieved</article-title>. <source>J Immunol Res</source> (<year>2017</year>) <volume>2017</volume>:<fpage>5974574</fpage>. doi: <pub-id pub-id-type="doi">10.1155/2017/5974574</pub-id>
</citation>
</ref>
<ref id="B35">
<label>35</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mahajan</surname> <given-names>S</given-names>
</name>
<name>
<surname>Vita</surname> <given-names>R</given-names>
</name>
<name>
<surname>Shackelford</surname> <given-names>D</given-names>
</name>
<name>
<surname>Lane</surname> <given-names>J</given-names>
</name>
<name>
<surname>Schulten</surname> <given-names>V</given-names>
</name>
<name>
<surname>Zarebski</surname> <given-names>L</given-names>
</name>
<etal/>
</person-group>. <article-title>Epitope Specific Antibodies and T Cell Receptors in the Immune Epitope Database</article-title>. <source>Front Immunol</source> (<year>2018</year>) <volume>9</volume>:<elocation-id>2688</elocation-id>. doi: <pub-id pub-id-type="doi">10.3389/fimmu.2018.02688</pub-id>
</citation>
</ref>
<ref id="B36">
<label>36</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Seymour</surname> <given-names>E</given-names>
</name>
<name>
<surname>Damle</surname> <given-names>R</given-names>
</name>
<name>
<surname>Sette</surname> <given-names>A</given-names>
</name>
<name>
<surname>Peters</surname> <given-names>B</given-names>
</name>
</person-group>. <article-title>Cost Sensitive Hierarchical Document Classification to Triage PubMed Abstracts for Manual Curation</article-title>. <source>BMC Bioinf</source> (<year>2011</year>) <volume>12</volume>:<fpage>482</fpage>. doi: <pub-id pub-id-type="doi">10.1186/1471-2105-12-482</pub-id>
</citation>
</ref>
<ref id="B37">
<label>37</label>
<citation citation-type="book">
<person-group person-group-type="author">
<collab>IEDB</collab>
</person-group>. <source>Curation Manual 2.0</source>. (<year>2007</year>). Available at: <uri xlink:href="http://curationwiki.iedb.org/wiki/index.php/Curation_Manual2.0">http://curationwiki.iedb.org/wiki/index.php/Curation_Manual2.0</uri>
</citation>
</ref>
<ref id="B38">
<label>38</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Richters</surname> <given-names>MM</given-names>
</name>
<name>
<surname>Xia</surname> <given-names>H</given-names>
</name>
<name>
<surname>Campbell</surname> <given-names>KM</given-names>
</name>
<name>
<surname>Gillanders</surname> <given-names>WE</given-names>
</name>
<name>
<surname>Griffith</surname> <given-names>OL</given-names>
</name>
<name>
<surname>Griffith</surname> <given-names>M</given-names>
</name>
</person-group>. <article-title>Best Practices for Bioinformatic Characterization of Neoantigens for Clinical Utility</article-title>. <source>Genome Med</source> (<year>2019</year>) <volume>11</volume>:<fpage>56</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s13073-019-0666-2</pub-id>
</citation>
</ref>
<ref id="B39">
<label>39</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Trolle</surname> <given-names>T</given-names>
</name>
<name>
<surname>Metushi</surname> <given-names>IG</given-names>
</name>
<name>
<surname>Greenbaum</surname> <given-names>JA</given-names>
</name>
<name>
<surname>Kim</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Sidney</surname> <given-names>J</given-names>
</name>
<name>
<surname>Lund</surname> <given-names>O</given-names>
</name>
<etal/>
</person-group>. <article-title>Automated Benchmarking of Peptide-MHC Class I Binding Predictions</article-title>. <source>Bioinformatics</source> (<year>2015</year>) <volume>31</volume>:<page-range>2174&#x2013;81</page-range>. doi: <pub-id pub-id-type="doi">10.1093/bioinformatics/btv123</pub-id>
</citation>
</ref>
<ref id="B40">
<label>40</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Andreatta</surname> <given-names>M</given-names>
</name>
<name>
<surname>Trolle</surname> <given-names>T</given-names>
</name>
<name>
<surname>Yan</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Greenbaum</surname> <given-names>JA</given-names>
</name>
<name>
<surname>Peters</surname> <given-names>B</given-names>
</name>
<name>
<surname>Nielsen</surname> <given-names>M</given-names>
</name>
</person-group>. <article-title>An Automated Benchmarking Platform for MHC Class II Binding Prediction Methods</article-title>. <source>Bioinformatics</source> (<year>2018</year>) <volume>34</volume>:<page-range>1522&#x2013;8</page-range>. doi: <pub-id pub-id-type="doi">10.1093/bioinformatics/btx820</pub-id>
</citation>
</ref>
<ref id="B41">
<label>41</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kosaloglu-Yalcin</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Lanka</surname> <given-names>M</given-names>
</name>
<name>
<surname>Frentzen</surname> <given-names>A</given-names>
</name>
<name>
<surname>Logandha Ramamoorthy Premlal</surname> <given-names>A</given-names>
</name>
<name>
<surname>Sidney</surname> <given-names>J</given-names>
</name>
<name>
<surname>Vaughan</surname> <given-names>K</given-names>
</name>
<etal/>
</person-group>. <article-title>Predicting T Cell Recognition of MHC Class I Restricted Neoepitopes</article-title>. <source>Oncoimmunology</source> (<year>2018</year>) <volume>7</volume>:<fpage>e1492508</fpage>. doi: <pub-id pub-id-type="doi">10.1080/2162402X.2018.1492508</pub-id>
</citation>
</ref>
<ref id="B42">
<label>42</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gao</surname> <given-names>J</given-names>
</name>
<name>
<surname>Aksoy</surname> <given-names>BA</given-names>
</name>
<name>
<surname>Dogrusoz</surname> <given-names>U</given-names>
</name>
<name>
<surname>Dresdner</surname> <given-names>G</given-names>
</name>
<name>
<surname>Gross</surname> <given-names>B</given-names>
</name>
<name>
<surname>Sumer</surname> <given-names>SO</given-names>
</name>
<etal/>
</person-group>. <article-title>Integrative Analysis of Complex Cancer Genomics and Clinical Profiles Using the cBioPortal</article-title>. <source>Sci Signal</source> (<year>2013</year>) <volume>6</volume>:<fpage>pl1</fpage>. doi: <pub-id pub-id-type="doi">10.1126/scisignal.2004088</pub-id>
</citation>
</ref>
<ref id="B43">
<label>43</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Grossman</surname> <given-names>RL</given-names>
</name>
<name>
<surname>Heath</surname> <given-names>AP</given-names>
</name>
<name>
<surname>Ferretti</surname> <given-names>V</given-names>
</name>
<name>
<surname>Varmus</surname> <given-names>HE</given-names>
</name>
<name>
<surname>Lowy</surname> <given-names>DR</given-names>
</name>
<name>
<surname>Kibbe</surname> <given-names>WA</given-names>
</name>
<etal/>
</person-group>. <article-title>Toward a Shared Vision for Cancer Genomic Data</article-title>. <source>N Engl J Med</source> (<year>2016</year>) <volume>375</volume>:<page-range>1109&#x2013;12</page-range>. doi: <pub-id pub-id-type="doi">10.1056/NEJMp1607591</pub-id>
</citation>
</ref>
<ref id="B44">
<label>44</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Richman</surname> <given-names>LP</given-names>
</name>
<name>
<surname>Vonderheide</surname> <given-names>RH</given-names>
</name>
<name>
<surname>Rech</surname> <given-names>AJ</given-names>
</name>
</person-group>. <article-title>Neoantigen Dissimilarity to the Self-Proteome Predicts Immunogenicity and Response to Immune Checkpoint Blockade</article-title>. <source>Cell Syst</source> (<year>2019</year>) <volume>9</volume>:<fpage>375</fpage>&#x2013;<lpage>82.e4</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.cels.2019.08.009</pub-id>
</citation>
</ref>
<ref id="B45">
<label>45</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kim</surname> <given-names>S</given-names>
</name>
<name>
<surname>Kim</surname> <given-names>HS</given-names>
</name>
<name>
<surname>Kim</surname> <given-names>E</given-names>
</name>
<name>
<surname>Lee</surname> <given-names>MG</given-names>
</name>
<name>
<surname>Shin</surname> <given-names>EC</given-names>
</name>
<name>
<surname>Paik</surname> <given-names>S</given-names>
</name>
<etal/>
</person-group>. <article-title>Neopepsee: Accurate Genome-Level Prediction of Neoantigens by Harnessing Sequence and Amino Acid Immunogenicity Information</article-title>. <source>Ann Oncol</source> (<year>2018</year>) <volume>29</volume>:<page-range>1030&#x2013;6</page-range>. doi: <pub-id pub-id-type="doi">10.1093/annonc/mdy022</pub-id>
</citation>
</ref>
<ref id="B46">
<label>46</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Parkhurst</surname> <given-names>MR</given-names>
</name>
<name>
<surname>Robbins</surname> <given-names>PF</given-names>
</name>
<name>
<surname>Tran</surname> <given-names>E</given-names>
</name>
<name>
<surname>Prickett</surname> <given-names>TD</given-names>
</name>
<name>
<surname>Gartner</surname> <given-names>JJ</given-names>
</name>
<name>
<surname>Jia</surname> <given-names>L</given-names>
</name>
<etal/>
</person-group>. <article-title>Unique Neoantigens Arise From Somatic Mutations in Patients With Gastrointestinal Cancers</article-title>. <source>Cancer Discov</source> (<year>2019</year>) <volume>9</volume>:<page-range>1022&#x2013;35</page-range>. doi: <pub-id pub-id-type="doi">10.1158/2159-8290.CD-18-1494</pub-id>
</citation>
</ref>
<ref id="B47">
<label>47</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kreiter</surname> <given-names>S</given-names>
</name>
<name>
<surname>Vormehr</surname> <given-names>M</given-names>
</name>
<name>
<surname>van de Roemer</surname> <given-names>N</given-names>
</name>
<name>
<surname>Diken</surname> <given-names>M</given-names>
</name>
<name>
<surname>Lower</surname> <given-names>M</given-names>
</name>
<name>
<surname>Diekmann</surname> <given-names>J</given-names>
</name>
<etal/>
</person-group>. <article-title>Erratum: Mutant MHC Class II Epitopes Drive Therapeutic Immune Responses to Cancer</article-title>. <source>Nature</source> (<year>2015</year>) <volume>523</volume>:<fpage>370</fpage>. doi: <pub-id pub-id-type="doi">10.1038/nature14567</pub-id>
</citation>
</ref>
<ref id="B48">
<label>48</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Granados</surname> <given-names>DP</given-names>
</name>
<name>
<surname>Yahyaoui</surname> <given-names>W</given-names>
</name>
<name>
<surname>Laumont</surname> <given-names>CM</given-names>
</name>
<name>
<surname>Daouda</surname> <given-names>T</given-names>
</name>
<name>
<surname>Muratore-Schroeder</surname> <given-names>TL</given-names>
</name>
<name>
<surname>Cote</surname> <given-names>C</given-names>
</name>
<etal/>
</person-group>. <article-title>MHC I-Associated Peptides Preferentially Derive From Transcripts Bearing miRNA Response Elements</article-title>. <source>Blood</source> (<year>2012</year>) <volume>119</volume>:<page-range>e181&#x2013;91</page-range>. doi: <pub-id pub-id-type="doi">10.1182/blood-2012-02-412593</pub-id>
</citation>
</ref>
<ref id="B49">
<label>49</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wells</surname> <given-names>DK</given-names>
</name>
<name>
<surname>van Buuren</surname> <given-names>MM</given-names>
</name>
<name>
<surname>Dang</surname> <given-names>KK</given-names>
</name>
<name>
<surname>Hubbard-Lucey</surname> <given-names>VM</given-names>
</name>
<name>
<surname>Sheehan</surname> <given-names>KCF</given-names>
</name>
<name>
<surname>Campbell</surname> <given-names>KM</given-names>
</name>
<etal/>
</person-group>. <article-title>Key Parameters of Tumor Epitope Immunogenicity Revealed Through a Consortium Approach Improve Neoantigen Prediction</article-title>. <source>Cell</source> (<year>2020</year>) <volume>183</volume>:<fpage>818</fpage>&#x2013;<lpage>34.e13</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.cell.2020.09.015</pub-id>
</citation>
</ref>
<ref id="B50">
<label>50</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sarkizova</surname> <given-names>S</given-names>
</name>
<name>
<surname>Klaeger</surname> <given-names>S</given-names>
</name>
<name>
<surname>Le</surname> <given-names>PM</given-names>
</name>
<name>
<surname>Li</surname> <given-names>LW</given-names>
</name>
<name>
<surname>Oliveira</surname> <given-names>G</given-names>
</name>
<name>
<surname>Keshishian</surname> <given-names>H</given-names>
</name>
<etal/>
</person-group>. <article-title>A Large Peptidome Dataset Improves HLA Class I Epitope Prediction Across Most of the Human Population</article-title>. <source>Nat Biotechnol</source> (<year>2020</year>) <volume>38</volume>:<fpage>199</fpage>&#x2013;<lpage>209</lpage>. doi: <pub-id pub-id-type="doi">10.1038/s41587-019-0322-9</pub-id>
</citation>
</ref>
<ref id="B51">
<label>51</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bresciani</surname> <given-names>A</given-names>
</name>
<name>
<surname>Paul</surname> <given-names>S</given-names>
</name>
<name>
<surname>Schommer</surname> <given-names>N</given-names>
</name>
<name>
<surname>Dillon</surname> <given-names>MB</given-names>
</name>
<name>
<surname>Bancroft</surname> <given-names>T</given-names>
</name>
<name>
<surname>Greenbaum</surname> <given-names>J</given-names>
</name>
<etal/>
</person-group>. <article-title>T-Cell Recognition Is Shaped by Epitope Sequence Conservation in the Host Proteome and Microbiome</article-title>. <source>Immunology</source> (<year>2016</year>) <volume>148</volume>:<page-range>34&#x2013;9</page-range>. doi: <pub-id pub-id-type="doi">10.1111/imm.12585</pub-id>
</citation>
</ref>
<ref id="B52">
<label>52</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bjerregaard</surname> <given-names>AM</given-names>
</name>
<name>
<surname>Nielsen</surname> <given-names>M</given-names>
</name>
<name>
<surname>Jurtz</surname> <given-names>V</given-names>
</name>
<name>
<surname>Barra</surname> <given-names>CM</given-names>
</name>
<name>
<surname>Hadrup</surname> <given-names>SR</given-names>
</name>
<name>
<surname>Szallasi</surname> <given-names>Z</given-names>
</name>
<etal/>
</person-group>. <article-title>An Analysis of Natural T Cell Responses to Predicted Tumor Neoepitopes</article-title>. <source>Front Immunol</source> (<year>2017</year>) <volume>8</volume>:<elocation-id>1566</elocation-id>. doi: <pub-id pub-id-type="doi">10.3389/fimmu.2017.01566</pub-id>
</citation>
</ref>
<ref id="B53">
<label>53</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kim</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Sidney</surname> <given-names>J</given-names>
</name>
<name>
<surname>Pinilla</surname> <given-names>C</given-names>
</name>
<name>
<surname>Sette</surname> <given-names>A</given-names>
</name>
<name>
<surname>Peters</surname> <given-names>B</given-names>
</name>
</person-group>. <article-title>Derivation of an Amino Acid Similarity Matrix for Peptide: MHC Binding and Its Application as a Bayesian Prior</article-title>. <source>BMC Bioinf</source> (<year>2009</year>) <volume>10</volume>:<fpage>394</fpage>. doi: <pub-id pub-id-type="doi">10.1186/1471-2105-10-394</pub-id>
</citation>
</ref>
<ref id="B54">
<label>54</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mason</surname> <given-names>D</given-names>
</name>
</person-group>. <article-title>A Very High Level of Crossreactivity Is an Essential Feature of the T-Cell Receptor</article-title>. <source>Immunol Today</source> (<year>1998</year>) <volume>19</volume>:<fpage>395</fpage>&#x2013;<lpage>404</lpage>. doi: <pub-id pub-id-type="doi">10.1016/S0167-5699(98)01299-7</pub-id>
</citation>
</ref>
<ref id="B55">
<label>55</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sioud</surname> <given-names>M</given-names>
</name>
</person-group>. <article-title>T-Cell Cross-Reactivity May Explain the Large Variation in How Cancer Patients Respond to Checkpoint Inhibitors</article-title>. <source>Scand J Immunol</source> (<year>2018</year>) <volume>87</volume>:<fpage>e12643</fpage>. doi: <pub-id pub-id-type="doi">10.1111/sji.12643</pub-id>
</citation>
</ref>
<ref id="B56">
<label>56</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Luksza</surname> <given-names>M</given-names>
</name>
<name>
<surname>Riaz</surname> <given-names>N</given-names>
</name>
<name>
<surname>Makarov</surname> <given-names>V</given-names>
</name>
<name>
<surname>Balachandran</surname> <given-names>VP</given-names>
</name>
<name>
<surname>Hellmann</surname> <given-names>MD</given-names>
</name>
<name>
<surname>Solovyov</surname> <given-names>A</given-names>
</name>
<etal/>
</person-group>. <article-title>A Neoantigen Fitness Model Predicts Tumour Response to Checkpoint Blockade Immunotherapy</article-title>. <source>Nature</source> (<year>2017</year>) <volume>551</volume>:<page-range>517&#x2013;20</page-range>. doi: <pub-id pub-id-type="doi">10.1038/nature24473</pub-id>
</citation>
</ref>
<ref id="B57">
<label>57</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sondka</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Bamford</surname> <given-names>S</given-names>
</name>
<name>
<surname>Cole</surname> <given-names>CG</given-names>
</name>
<name>
<surname>Ward</surname> <given-names>SA</given-names>
</name>
<name>
<surname>Dunham</surname> <given-names>I</given-names>
</name>
<name>
<surname>Forbes</surname> <given-names>SA</given-names>
</name>
</person-group>. <article-title>The COSMIC Cancer Gene Census: Describing Genetic Dysfunction Across All Human Cancers</article-title>. <source>Nat Rev Cancer</source> (<year>2018</year>) <volume>18</volume>:<fpage>696</fpage>&#x2013;<lpage>705</lpage>. doi: <pub-id pub-id-type="doi">10.1038/s41568-018-0060-1</pub-id>
</citation>
</ref>
<ref id="B58">
<label>58</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chronister</surname> <given-names>WD</given-names>
</name>
<name>
<surname>Crinklaw</surname> <given-names>A</given-names>
</name>
<name>
<surname>Mahajan</surname> <given-names>S</given-names>
</name>
<name>
<surname>Vita</surname> <given-names>R</given-names>
</name>
<name>
<surname>Kosaloglu-Yalcin</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Yan</surname> <given-names>Z</given-names>
</name>
<etal/>
</person-group>. <article-title>TCRMatch: Predicting T-Cell Receptor Specificity Based on Sequence Similarity to Previously Characterized Receptors</article-title>. <source>Front Immunol</source> (<year>2021</year>) <volume>12</volume>:<elocation-id>640725</elocation-id>. doi: <pub-id pub-id-type="doi">10.3389/fimmu.2021.640725</pub-id>
</citation>
</ref>
<ref id="B59">
<label>59</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Vormehr</surname> <given-names>M</given-names>
</name>
<name>
<surname>Tureci</surname> <given-names>O</given-names>
</name>
<name>
<surname>Sahin</surname> <given-names>U</given-names>
</name>
</person-group>. <article-title>Harnessing Tumor Mutations for Truly Individualized Cancer Vaccines</article-title>. <source>Annu Rev Med</source> (<year>2019</year>) <volume>70</volume>:<fpage>395</fpage>&#x2013;<lpage>407</lpage>. doi: <pub-id pub-id-type="doi">10.1146/annurev-med-042617-101816</pub-id>
</citation>
</ref>
<ref id="B60">
<label>60</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Guedan</surname> <given-names>S</given-names>
</name>
<name>
<surname>Ruella</surname> <given-names>M</given-names>
</name>
<name>
<surname>June</surname> <given-names>CH</given-names>
</name>
</person-group>. <article-title>Emerging Cellular Therapies for Cancer</article-title>. <source>Annu Rev Immunol</source> (<year>2019</year>) <volume>37</volume>:<page-range>145&#x2013;71</page-range>. doi: <pub-id pub-id-type="doi">10.1146/annurev-immunol-042718-041407</pub-id>
</citation>
</ref>
<ref id="B61">
<label>61</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tran</surname> <given-names>E</given-names>
</name>
<name>
<surname>Turcotte</surname> <given-names>S</given-names>
</name>
<name>
<surname>Gros</surname> <given-names>A</given-names>
</name>
<name>
<surname>Robbins</surname> <given-names>PF</given-names>
</name>
<name>
<surname>Lu</surname> <given-names>YC</given-names>
</name>
<name>
<surname>Dudley</surname> <given-names>ME</given-names>
</name>
<etal/>
</person-group>. <article-title>Cancer Immunotherapy Based on Mutation-Specific CD4+ T Cells in a Patient With Epithelial Cancer</article-title>. <source>Science</source> (<year>2014</year>) <volume>344</volume>:<page-range>641&#x2013;5</page-range>. doi: <pub-id pub-id-type="doi">10.1126/science.1251102</pub-id>
</citation>
</ref>
<ref id="B62">
<label>62</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Carreno</surname> <given-names>BM</given-names>
</name>
<name>
<surname>Magrini</surname> <given-names>V</given-names>
</name>
<name>
<surname>Becker-Hapak</surname> <given-names>M</given-names>
</name>
<name>
<surname>Kaabinejadian</surname> <given-names>S</given-names>
</name>
<name>
<surname>Hundal</surname> <given-names>J</given-names>
</name>
<name>
<surname>Petti</surname> <given-names>AA</given-names>
</name>
<etal/>
</person-group>. <article-title>Cancer Immunotherapy. A Dendritic Cell Vaccine Increases the Breadth and Diversity of Melanoma Neoantigen-Specific T Cells</article-title>. <source>Science</source> (<year>2015</year>) <volume>348</volume>:<page-range>803&#x2013;8</page-range>. doi: <pub-id pub-id-type="doi">10.1126/science.aaa3828</pub-id>
</citation>
</ref>
<ref id="B63">
<label>63</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gubin</surname> <given-names>MM</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>X</given-names>
</name>
<name>
<surname>Schuster</surname> <given-names>H</given-names>
</name>
<name>
<surname>Caron</surname> <given-names>E</given-names>
</name>
<name>
<surname>Ward</surname> <given-names>JP</given-names>
</name>
<name>
<surname>Noguchi</surname> <given-names>T</given-names>
</name>
<etal/>
</person-group>. <article-title>Checkpoint Blockade Cancer Immunotherapy Targets Tumour-Specific Mutant Antigens</article-title>. <source>Nature</source> (<year>2014</year>) <volume>515</volume>:<page-range>577&#x2013;81</page-range>. doi: <pub-id pub-id-type="doi">10.1038/nature13988</pub-id>
</citation>
</ref>
<ref id="B64">
<label>64</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hinrichs</surname> <given-names>CS</given-names>
</name>
<name>
<surname>Rosenberg</surname> <given-names>SA</given-names>
</name>
</person-group>. <article-title>Exploiting the Curative Potential of Adoptive T-Cell Therapy for Cancer</article-title>. <source>Immunol Rev</source> (<year>2014</year>) <volume>257</volume>:<fpage>56</fpage>&#x2013;<lpage>71</lpage>. doi: <pub-id pub-id-type="doi">10.1111/imr.12132</pub-id>
</citation>
</ref>
<ref id="B65">
<label>65</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Castle</surname> <given-names>JC</given-names>
</name>
<name>
<surname>Kreiter</surname> <given-names>S</given-names>
</name>
<name>
<surname>Diekmann</surname> <given-names>J</given-names>
</name>
<name>
<surname>Lower</surname> <given-names>M</given-names>
</name>
<name>
<surname>van de Roemer</surname> <given-names>N</given-names>
</name>
<name>
<surname>de Graaf</surname> <given-names>J</given-names>
</name>
<etal/>
</person-group>. <article-title>Exploiting the Mutanome for Tumor Vaccination</article-title>. <source>Cancer Res</source> (<year>2012</year>) <volume>72</volume>:<page-range>1081&#x2013;91</page-range>. doi: <pub-id pub-id-type="doi">10.1158/0008-5472.CAN-11-3722</pub-id>
</citation>
</ref>
<ref id="B66">
<label>66</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rosenberg</surname> <given-names>SA</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>JC</given-names>
</name>
<name>
<surname>Schwartzentruber</surname> <given-names>DJ</given-names>
</name>
<name>
<surname>Hwu</surname> <given-names>P</given-names>
</name>
<name>
<surname>Marincola</surname> <given-names>FM</given-names>
</name>
<name>
<surname>Topalian</surname> <given-names>SL</given-names>
</name>
<etal/>
</person-group>. <article-title>Immunologic and Therapeutic Evaluation of a Synthetic Peptide Vaccine for the Treatment of Patients With Metastatic Melanoma</article-title>. <source>Nat Med</source> (<year>1998</year>) <volume>4</volume>:<page-range>321&#x2013;7</page-range>. doi: <pub-id pub-id-type="doi">10.1038/nm0398-321</pub-id>
</citation>
</ref>
<ref id="B67">
<label>67</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rosato</surname> <given-names>A</given-names>
</name>
<name>
<surname>Zoso</surname> <given-names>A</given-names>
</name>
<name>
<surname>Milan</surname> <given-names>G</given-names>
</name>
<name>
<surname>Macino</surname> <given-names>B</given-names>
</name>
<name>
<surname>Dalla Santa</surname> <given-names>S</given-names>
</name>
<name>
<surname>Tosello</surname> <given-names>V</given-names>
</name>
<etal/>
</person-group>. <article-title>Individual Analysis of Mice Vaccinated Against a Weakly Immunogenic Self Tumor-Specific Antigen Reveals a Correlation Between CD8 T Cell Response and Antitumor Efficacy</article-title>. <source>J Immunol</source> (<year>2003</year>) <volume>171</volume>:<page-range>5172&#x2013;9</page-range>. doi: <pub-id pub-id-type="doi">10.4049/jimmunol.171.10.5172</pub-id>
</citation>
</ref>
<ref id="B68">
<label>68</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Anichini</surname> <given-names>A</given-names>
</name>
<name>
<surname>Molla</surname> <given-names>A</given-names>
</name>
<name>
<surname>Mortarini</surname> <given-names>R</given-names>
</name>
<name>
<surname>Tragni</surname> <given-names>G</given-names>
</name>
<name>
<surname>Bersani</surname> <given-names>I</given-names>
</name>
<name>
<surname>Di Nicola</surname> <given-names>M</given-names>
</name>
<etal/>
</person-group>. <article-title>An Expanded Peripheral T Cell Population to a Cytotoxic T Lymphocyte (CTL)-Defined, Melanocyte-Specific Antigen in Metastatic Melanoma Patients Impacts on Generation of Peptide-Specific CTLs But Does Not Overcome Tumor Escape From Immune Surveillance in Metastatic Lesions</article-title>. <source>J Exp Med</source> (<year>1999</year>) <volume>190</volume>:<page-range>651&#x2013;67</page-range>. doi: <pub-id pub-id-type="doi">10.1084/jem.190.5.651</pub-id>
</citation>
</ref>
<ref id="B69">
<label>69</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ghorani</surname> <given-names>E</given-names>
</name>
<name>
<surname>Rosenthal</surname> <given-names>R</given-names>
</name>
<name>
<surname>McGranahan</surname> <given-names>N</given-names>
</name>
<name>
<surname>Reading</surname> <given-names>JL</given-names>
</name>
<name>
<surname>Lynch</surname> <given-names>M</given-names>
</name>
<name>
<surname>Peggs</surname> <given-names>KS</given-names>
</name>
<etal/>
</person-group>. <article-title>Differential Binding Affinity of Mutated Peptides for MHC Class I Is a Predictor of Survival in Advanced Lung Cancer and Melanoma</article-title>. <source>Ann Oncol</source> (<year>2018</year>) <volume>29</volume>:<page-range>271&#x2013;9</page-range>. doi: <pub-id pub-id-type="doi">10.1093/annonc/mdx687</pub-id>
</citation>
</ref>
<ref id="B70">
<label>70</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rech</surname> <given-names>AJ</given-names>
</name>
<name>
<surname>Balli</surname> <given-names>D</given-names>
</name>
<name>
<surname>Mantero</surname> <given-names>A</given-names>
</name>
<name>
<surname>Ishwaran</surname> <given-names>H</given-names>
</name>
<name>
<surname>Nathanson</surname> <given-names>KL</given-names>
</name>
<name>
<surname>Stanger</surname> <given-names>BZ</given-names>
</name>
<etal/>
</person-group>. <article-title>Tumor Immunity and Survival as a Function of Alternative Neopeptides in Human Cancer</article-title>. <source>Cancer Immunol Res</source> (<year>2018</year>) <volume>6</volume>:<page-range>276&#x2013;87</page-range>. doi: <pub-id pub-id-type="doi">10.1158/2326-6066.CIR-17-0559</pub-id>
</citation>
</ref>
<ref id="B71">
<label>71</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Brennick</surname> <given-names>CA</given-names>
</name>
<name>
<surname>George</surname> <given-names>MM</given-names>
</name>
<name>
<surname>Moussa</surname> <given-names>MM</given-names>
</name>
<name>
<surname>Hagymasi</surname> <given-names>AT</given-names>
</name>
<name>
<surname>Seesi</surname> <given-names>SA</given-names>
</name>
<name>
<surname>Shcheglova</surname> <given-names>TV</given-names>
</name>
<etal/>
</person-group>. <article-title>An Unbiased Approach to Defining Bona Fide Cancer Neoepitopes That Elicit Immune-Mediated Cancer Rejection</article-title>. <source>J Clin Invest</source> (<year>2021</year>) <volume>131</volume>(<issue>3</issue>):<page-range>e142823</page-range>. doi: <pub-id pub-id-type="doi">10.1172/JCI142823</pub-id>
</citation>
</ref>
<ref id="B72">
<label>72</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ebrahimi-Nik</surname> <given-names>H</given-names>
</name>
<name>
<surname>Michaux</surname> <given-names>J</given-names>
</name>
<name>
<surname>Corwin</surname> <given-names>WL</given-names>
</name>
<name>
<surname>Keller</surname> <given-names>GL</given-names>
</name>
<name>
<surname>Shcheglova</surname> <given-names>T</given-names>
</name>
<name>
<surname>Pak</surname> <given-names>H</given-names>
</name>
<etal/>
</person-group>. <article-title>Mass Spectrometry Driven Exploration Reveals Nuances of Neoepitope-Driven Tumor Rejection</article-title>. <source>JCI Insight</source> (<year>2019</year>) <volume>5</volume>(<issue>14</issue>):<page-range>e129152</page-range>. doi: <pub-id pub-id-type="doi">10.1172/jci.insight.129152</pub-id>
</citation>
</ref>
<ref id="B73">
<label>73</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname> <given-names>B</given-names>
</name>
<name>
<surname>Khodadoust</surname> <given-names>MS</given-names>
</name>
<name>
<surname>Olsson</surname> <given-names>N</given-names>
</name>
<name>
<surname>Wagar</surname> <given-names>LE</given-names>
</name>
<name>
<surname>Fast</surname> <given-names>E</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>CL</given-names>
</name>
<etal/>
</person-group>. <article-title>Predicting HLA Class II Antigen Presentation Through Integrated Deep Learning</article-title>. <source>Nat Biotechnol</source> (<year>2019</year>) <volume>37</volume>:<page-range>1332&#x2013;43</page-range>. doi: <pub-id pub-id-type="doi">10.1038/s41587-019-0280-2</pub-id>
</citation>
</ref>
<ref id="B74">
<label>74</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Abelin</surname> <given-names>JG</given-names>
</name>
<name>
<surname>Harjanto</surname> <given-names>D</given-names>
</name>
<name>
<surname>Malloy</surname> <given-names>M</given-names>
</name>
<name>
<surname>Suri</surname> <given-names>P</given-names>
</name>
<name>
<surname>Colson</surname> <given-names>T</given-names>
</name>
<name>
<surname>Goulding</surname> <given-names>SP</given-names>
</name>
<etal/>
</person-group>. <article-title>Defining HLA-II Ligand Processing and Binding Rules With Mass Spectrometry Enhances Cancer Epitope Prediction</article-title>. <source>Immunity</source> (<year>2019</year>) <volume>51</volume>:<fpage>766</fpage>&#x2013;<lpage>79.e17</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.immuni.2019.08.012</pub-id>
</citation>
</ref>
<ref id="B75">
<label>75</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bulik-Sullivan</surname> <given-names>B</given-names>
</name>
<name>
<surname>Busby</surname> <given-names>J</given-names>
</name>
<name>
<surname>Palmer</surname> <given-names>CD</given-names>
</name>
<name>
<surname>Davis</surname> <given-names>MJ</given-names>
</name>
<name>
<surname>Murphy</surname> <given-names>T</given-names>
</name>
<name>
<surname>Clark</surname> <given-names>A</given-names>
</name>
<etal/>
</person-group>. <article-title>Deep Learning Using Tumor HLA Peptide Mass Spectrometry Datasets Improves Neoantigen Identification</article-title>. <source>Nat Biotechnol</source> (<year>2019</year>) <volume>37</volume>:<fpage>55</fpage>&#x2013;<lpage>63</lpage>. doi: <pub-id pub-id-type="doi">10.1038/nbt.4313</pub-id>
</citation>
</ref>
<ref id="B76">
<label>76</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Muller</surname> <given-names>M</given-names>
</name>
<name>
<surname>Gfeller</surname> <given-names>D</given-names>
</name>
<name>
<surname>Coukos</surname> <given-names>G</given-names>
</name>
<name>
<surname>Bassani-Sternberg</surname> <given-names>M</given-names>
</name>
</person-group>. <article-title>'Hotspots' of Antigen Presentation Revealed by Human Leukocyte Antigen Ligandomics for Neoantigen Prioritization</article-title>. <source>Front Immunol</source> (<year>2017</year>) <volume>8</volume>:<elocation-id>1367</elocation-id>. doi: <pub-id pub-id-type="doi">10.3389/fimmu.2017.01367</pub-id>
</citation>
</ref>
<ref id="B77">
<label>77</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bassani-Sternberg</surname> <given-names>M</given-names>
</name>
<name>
<surname>Chong</surname> <given-names>C</given-names>
</name>
<name>
<surname>Guillaume</surname> <given-names>P</given-names>
</name>
<name>
<surname>Solleder</surname> <given-names>M</given-names>
</name>
<name>
<surname>Pak</surname> <given-names>H</given-names>
</name>
<name>
<surname>Gannon</surname> <given-names>PO</given-names>
</name>
<etal/>
</person-group>. <article-title>Deciphering HLA-I Motifs Across HLA Peptidomes Improves Neo-Antigen Predictions and Identifies Allostery Regulating HLA Specificity</article-title>. <source>PLoS Comput Biol</source> (<year>2017</year>) <volume>13</volume>:<fpage>e1005725</fpage>. doi: <pub-id pub-id-type="doi">10.1371/journal.pcbi.1005725</pub-id>
</citation>
</ref>
<ref id="B78">
<label>78</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cole</surname> <given-names>DK</given-names>
</name>
<name>
<surname>Bulek</surname> <given-names>AM</given-names>
</name>
<name>
<surname>Dolton</surname> <given-names>G</given-names>
</name>
<name>
<surname>Schauenburg</surname> <given-names>AJ</given-names>
</name>
<name>
<surname>Szomolay</surname> <given-names>B</given-names>
</name>
<name>
<surname>Rittase</surname> <given-names>W</given-names>
</name>
<etal/>
</person-group>. <article-title>Hotspot Autoimmune T Cell Receptor Binding Underlies Pathogen and Insulin Peptide Cross-Reactivity</article-title>. <source>J Clin Invest</source> (<year>2016</year>) <volume>126</volume>:<fpage>3626</fpage>. doi: <pub-id pub-id-type="doi">10.1172/JCI89919</pub-id>
</citation>
</ref>
<ref id="B79">
<label>79</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bethune</surname> <given-names>MT</given-names>
</name>
<name>
<surname>Joglekar</surname> <given-names>AV</given-names>
</name>
</person-group>. <article-title>Personalized T Cell-Mediated Cancer Immunotherapy: Progress and Challenges</article-title>. <source>Curr Opin Biotechnol</source> (<year>2017</year>) <volume>48</volume>:<page-range>142&#x2013;52</page-range>. doi: <pub-id pub-id-type="doi">10.1016/j.copbio.2017.03.024</pub-id>
</citation>
</ref>
<ref id="B80">
<label>80</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Linette</surname> <given-names>GP</given-names>
</name>
<name>
<surname>Stadtmauer</surname> <given-names>EA</given-names>
</name>
<name>
<surname>Maus</surname> <given-names>MV</given-names>
</name>
<name>
<surname>Rapoport</surname> <given-names>AP</given-names>
</name>
<name>
<surname>Levine</surname> <given-names>BL</given-names>
</name>
<name>
<surname>Emery</surname> <given-names>L</given-names>
</name>
<etal/>
</person-group>. <article-title>Cardiovascular Toxicity and Titin Cross-Reactivity of Affinity-Enhanced T Cells in Myeloma and Melanoma</article-title>. <source>Blood</source> (<year>2013</year>) <volume>122</volume>:<page-range>863&#x2013;71</page-range>. doi: <pub-id pub-id-type="doi">10.1182/blood-2013-03-490565</pub-id>
</citation>
</ref>
<ref id="B81">
<label>81</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cameron</surname> <given-names>BJ</given-names>
</name>
<name>
<surname>Gerry</surname> <given-names>AB</given-names>
</name>
<name>
<surname>Dukes</surname> <given-names>J</given-names>
</name>
<name>
<surname>Harper</surname> <given-names>JV</given-names>
</name>
<name>
<surname>Kannan</surname> <given-names>V</given-names>
</name>
<name>
<surname>Bianchi</surname> <given-names>FC</given-names>
</name>
<etal/>
</person-group>. <article-title>Identification of a Titin-Derived HLA-A1-Presented Peptide as a Cross-Reactive Target for Engineered MAGE A3-Directed T Cells</article-title>. <source>Sci Transl Med</source> (<year>2013</year>) <volume>5</volume>:<fpage>197ra103</fpage>. doi: <pub-id pub-id-type="doi">10.1126/scitranslmed.3006034</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>