<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Immunol.</journal-id>
<journal-title>Frontiers in Immunology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Immunol.</abbrev-journal-title>
<issn pub-type="epub">1664-3224</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fimmu.2018.02294</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Immunology</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Reference Grade Characterization of Polymorphisms in Full-Length HLA Class I and II Genes With Short-Read Sequencing on the ION PGM System and Long-Reads Generated by Single Molecule, Real-Time Sequencing on the PacBio Platform</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name><surname>Suzuki</surname> <given-names>Shingo</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/566642/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Ranade</surname> <given-names>Swati</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Osaki</surname> <given-names>Ken</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Ito</surname> <given-names>Sayaka</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Shigenari</surname> <given-names>Atsuko</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Ohnuki</surname> <given-names>Yuko</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Oka</surname> <given-names>Akira</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Masuya</surname> <given-names>Anri</given-names></name>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Harting</surname> <given-names>John</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/579099/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Baybayan</surname> <given-names>Primo</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Kitazume</surname> <given-names>Miwako</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/566697/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Sunaga</surname> <given-names>Junichi</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Morishima</surname> <given-names>Satoko</given-names></name>
<xref ref-type="aff" rid="aff6"><sup>6</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Morishima</surname> <given-names>Yasuo</given-names></name>
<xref ref-type="aff" rid="aff7"><sup>7</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/139781/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Inoko</surname> <given-names>Hidetoshi</given-names></name>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Kulski</surname> <given-names>Jerzy K.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff8"><sup>8</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/605608/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Shiina</surname> <given-names>Takashi</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x0002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/550671/overview"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>Division of Basic Medical Science and Molecular Medicine, Department of Molecular Life Science, Tokai University School of Medicine</institution>, <addr-line>Isehara</addr-line>, <country>Japan</country></aff>
<aff id="aff2"><sup>2</sup><institution>Molecular Biology Applications, Pacific Biosciences, Inc</institution>, <addr-line>Menlo Park, CA</addr-line>, <country>United States</country></aff>
<aff id="aff3"><sup>3</sup><institution>Pacific Biosciences Division, Tomy Digital Biology Co., Ltd</institution>, <addr-line>Tokyo</addr-line>, <country>Japan</country></aff>
<aff id="aff4"><sup>4</sup><institution>The Institute of Medical Sciences, Tokai University</institution>, <addr-line>Isehara</addr-line>, <country>Japan</country></aff>
<aff id="aff5"><sup>5</sup><institution>GenoDive Pharma Inc.</institution>, <addr-line>Atsugi</addr-line>, <country>Japan</country></aff>
<aff id="aff6"><sup>6</sup><institution>Division of Endocrinology, Diabetes, and Metabolism, Hematology, Rheumatology (Second Department of Internal Medicine), Graduate School of Medicine, University of the Ryukyus</institution>, <addr-line>Nishihara</addr-line>, <country>Japan</country></aff>
<aff id="aff7"><sup>7</sup><institution>Department of Promotion for Blood and Marrow Transplantation, Aichi Medical University School of Medicine</institution>, <addr-line>Nagakute</addr-line>, <country>Japan</country></aff>
<aff id="aff8"><sup>8</sup><institution>School of Psychiatry and Clinical Neurosciences, The University of Western Australia</institution>, <addr-line>Perth, WA</addr-line>, <country>Australia</country></aff>
<author-notes>
<fn fn-type="edited-by"><p>Edited by: Katharina Fleischhauer, Universit&#x000E4;tsklinikum Essen, Germany</p></fn>
<fn fn-type="edited-by"><p>Reviewed by: M&#x000FC;berra Ahci, Universit&#x000E4;tsklinikum Essen, Germany; Neema P. Mayor, Anthony Nolan, United Kingdom; Vinzenz Lange, DKMS Life Science Lab GmbH, Germany</p></fn>
<corresp id="c001">&#x0002A;Correspondence: Takashi Shiina <email>tshiina&#x00040;is.icc.u-tokai.ac.jp</email></corresp>
<fn fn-type="other" id="fn001"><p>This article was submitted to Alloimmunity and Transplantation, a section of the journal Frontiers in Immunology</p></fn></author-notes>
<pub-date pub-type="epub">
<day>04</day>
<month>10</month>
<year>2018</year>
</pub-date>
<pub-date pub-type="collection">
<year>2018</year>
</pub-date>
<volume>9</volume>
<elocation-id>2294</elocation-id>
<history>
<date date-type="received">
<day>16</day>
<month>04</month>
<year>2018</year>
</date>
<date date-type="accepted">
<day>17</day>
<month>09</month>
<year>2018</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x000A9; 2018 Suzuki, Ranade, Osaki, Ito, Shigenari, Ohnuki, Oka, Masuya, Harting, Baybayan, Kitazume, Sunaga, Morishima, Morishima, Inoko, Kulski and Shiina.</copyright-statement>
<copyright-year>2018</copyright-year>
<copyright-holder>Suzuki, Ranade, Osaki, Ito, Shigenari, Ohnuki, Oka, Masuya, Harting, Baybayan, Kitazume, Sunaga, Morishima, Morishima, Inoko, Kulski and Shiina</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<abstract><p>Although NGS technologies fuel advances in high-throughput HLA genotyping methods for identification and classification of HLA genes to assist with precision medicine efforts in disease and transplantation, the efficiency of these methods are impeded by the absence of adequately-characterized high-frequency HLA allele reference sequence databases for the highly polymorphic HLA gene system. Here, we report on producing a comprehensive collection of full-length HLA allele sequences for eight classical HLA loci found in the Japanese population. We augmented the second-generation short read data generated by the Ion Torrent technology with long amplicon spanning consensus reads delivered by the third-generation SMRT sequencing method to create reference grade high-quality sequences of HLA class I and II gene alleles resolved at the genomic coding and non-coding level. Forty-six DNAs were obtained from a reference set used previously to establish the HLA allele frequency data in Japanese subjects. The samples included alleles with a collective allele frequency in the Japanese population of more than 99.2%. The HLA loci were independently amplified by long-range PCR using previously designed HLA-locus specific primers and subsequently sequenced using SMRT and Ion PGM sequencers. The mapped long and short-reads were used to produce a reference library of consensus HLA allelic sequences with the help of the reference-aware software tool LAA for SMRT Sequencing. A total of 253 distinct alleles were determined for 46 healthy subjects. Of them, 137 were novel alleles: 101 SNVs and/or indels and 36 extended alleles at a partial or full-length level. Comparing the HLA sequences from the perspective of nucleotide diversity revealed that HLA-DRB1 was the most divergent among the eight HLA genes, and that the HLA-DPB1 gene sequences diverged into two distinct groups, DP2 and DP5, with evidence of independent polymorphisms generated in exon 2. We also identified two specific intronic variations in HLA-DRB1 that might be involved in rheumatoid arthritis. In conclusion, full-length HLA allele sequencing by third-generation and second-generation technologies has provided polymorphic gene reference sequences at a genomic allelic resolution including allelic variations assigned up to the field-4 level for a stronger foundation in precision medicine and HLA-related disease and transplantation studies.</p></abstract>
<kwd-group>
<kwd>human leukocyte antigen</kwd>
<kwd>HLA</kwd>
<kwd>next-generation sequencing</kwd>
<kwd>NGS</kwd>
<kwd>SMRT sequencing</kwd>
<kwd>genotyping</kwd>
<kwd>PacBio RS II</kwd>
<kwd>Ion PGM</kwd>
</kwd-group>
<contract-num rid="cn001">16H06502</contract-num>
<contract-num rid="cn002">15ek0510002h0202</contract-num>
<contract-num rid="cn002">17ek0510022s0301</contract-num>
<contract-sponsor id="cn001">Ministry of Education, Culture, Sports, Science and Technology<named-content content-type="fundref-id">10.13039/501100001700</named-content></contract-sponsor>
<contract-sponsor id="cn002">Japan Agency for Medical Research and Development<named-content content-type="fundref-id">10.13039/100009619</named-content></contract-sponsor>
<counts>
<fig-count count="3"/>
<table-count count="4"/>
<equation-count count="0"/>
<ref-count count="61"/>
<page-count count="15"/>
<word-count count="10832"/>
</counts>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="s1">
<title>Introduction</title>
<p>The Major Histocompatibility Complex (MHC) comprising HLA class I and class II molecules (antigens) are polymorphic cell-membrane-bound glycoproteins that regulate the immune response by presenting peptides of fragmented proteins to circulating cytotoxic and helper T lymphocytes, respectively. These peptide-presenting-antigens are encoded by the genomic regions within the MHC that in humans are known specifically as the Human Leukocyte Antigen (HLA) class I and class II gene loci. The HLA molecules are investigated continuously due to their crucial role in the regulation of innate and adaptive immune responses (<xref ref-type="bibr" rid="B1">1</xref>, <xref ref-type="bibr" rid="B2">2</xref>), during rejection, graft-versus-host disease (GVHD) of hematopoietic stem cell transplants (<xref ref-type="bibr" rid="B3">3</xref>, <xref ref-type="bibr" rid="B4">4</xref>) and the pathogenesis of numerous infectious and/or autoimmune diseases (<xref ref-type="bibr" rid="B5">5</xref>&#x02013;<xref ref-type="bibr" rid="B8">8</xref>).</p>
<p>Conventional PCR-based genotyping approaches incorporating restriction fragment length polymorphism (PCR-RFLP) (<xref ref-type="bibr" rid="B9">9</xref>), single strand conformation polymorphism (PCR-SSCP) (<xref ref-type="bibr" rid="B10">10</xref>), sequence-specific oligonucleotides (PCR-SSO) (<xref ref-type="bibr" rid="B11">11</xref>), sequence-specific primers (PCR-SSP) (<xref ref-type="bibr" rid="B12">12</xref>), and Sanger sequencing-based typing (PCR-SBT) (<xref ref-type="bibr" rid="B13">13</xref>) have been used for HLA-testing in disease association and pre-transplantation (<xref ref-type="bibr" rid="B14">14</xref>&#x02013;<xref ref-type="bibr" rid="B16">16</xref>) analysis. However, these methods are limited in their ability to decipher chromosomal phase (<italic>cis/trans</italic>) ambiguity and/or imprecise allele identification (<xref ref-type="bibr" rid="B17">17</xref>, <xref ref-type="bibr" rid="B18">18</xref>) and may leave multiple pairs of HLA gene alleles unresolved. Moreover, the traditional methods focus only on the variations in the highly polymorphic regions of the HLA genes, and thus the majority of the assays only interrogate exons 2 and 3 or exons 2, 3, and 4 of the class I loci and exons 2 or exons 2 and 3 of class II. As a result, the genetic variations in the non-coding regions that regulate RNA expression levels (<xref ref-type="bibr" rid="B19">19</xref>&#x02013;<xref ref-type="bibr" rid="B21">21</xref>), or the exonic coding sequences outside of the polymorphic domains have remained largely ignored. On the other hand, methods that use full-length gene sequences including the promoter-enhancer region, 5&#x02032; and 3&#x02032; untranslated regions (UTRs), as well as all exonic and intronic regions for HLA genotyping, would be more accurate for the discovery of new polymorphisms associated with disease susceptibility and transplantation outcome. To this end, however, not more than 10% of &#x0007E; 17,700 known alleles in the IPD-IMGT/HLA reference database [Release 3.31, <ext-link ext-link-type="uri" xlink:href="https://www.ebi.ac.uk/ipd/imgt/hla/">https://www.ebi.ac.uk/ipd/imgt/hla/</ext-link>, (<xref ref-type="bibr" rid="B22">22</xref>)] are classified as full-length HLA gene sequences. Consequently, a comprehensive collection and classification of full-length HLA allele sequences including information from the &#x0201C;undetermined&#x0201D; regions of the HLA genes are desired to promote the future development of more accurate and reliable HLA genotyping methods.</p>
<p>During the past decade, next-generation sequencing (NGS) using mostly second-generation short-read sequencing technologies have employed exon sequencing for some or all of the HLA coding regions in an attempt to solve the phase ambiguity problem encountered by the conventional Sanger Sequencing-Based HLA genotyping methods (<xref ref-type="bibr" rid="B23">23</xref>). We previously reported on the development of super high resolution-sequence-based typing application using two NGS platforms, Ion PGM (Life Technologies) and GS Junior (Roche) (<xref ref-type="bibr" rid="B24">24</xref>&#x02013;<xref ref-type="bibr" rid="B26">26</xref>). In both of the studies, long-range PCR amplicons from the promoter-enhancer region to 3&#x02032;UTR for eight classical HLA loci, HLA-A, HLA-B, HLA-C, HLA-DRB1, HLA-DQA1, HLA-DQB1, HLA-DPA1, and HLA-DPB1 were shotgun sequenced. Other long-range PCR and NGS-based shotgun sequencing based HLA genotyping methods using the 454 GS-FLX (Roche) and the MiSeq/HiSeq (Illumina) platforms (<xref ref-type="bibr" rid="B18">18</xref>, <xref ref-type="bibr" rid="B27">27</xref>&#x02013;<xref ref-type="bibr" rid="B32">32</xref>) also can resolve many of the phase ambiguities. However, all of these methods are affected by the disadvantages associated with the short-read lengths of NGS technologies, which range from 150 to 500 bp. Although the short-read sequences can accurately separate the two phases in SNP dense regions, such as a polymorphic exon, the phasing is impossible in SNP deficient regions (Figure <xref ref-type="fig" rid="F1">1</xref>). Specifically, it is necessary to have at least two single nucleotide variants (SNVs) in one short-read sequence to separate both phases. The full-length HLA allele sequences are especially difficult to phase in the HLA-DQA1, HLA-DPA1, and HLA-DPB1 loci because their SNP densities are much less than in the other HLA loci (<xref ref-type="bibr" rid="B24">24</xref>), making it unlikely that two SNPs will appear in one short-read sequence.</p>
<fig id="F1" position="float">
<label>Figure 1</label>
<caption><p>DNA based HLA-genotyping scheme for sequencing platforms representing the first-generation, second-generation and third-generation technologies. The phase ambiguities of the SNV G/A at loci SNV1, SNV2, and SNV3 are easier to resolve using 2nd and/or 3rd generation sequencing than 1st generation Sanger sequencing.</p></caption>
<graphic xlink:href="fimmu-09-02294-g0001.tif"/>
</fig>
<p>In contrast to the second-generation sequencers, the third-generation sequencers such as the Single Molecule, Real-Time (SMRT) Sequencing platform PacBio RS II provide continuous long-reads with an average read-length of 10 kb or more. The consensus sequences generated from these long-reads can resolve the limitations of the current second-generation NGS methods as they span most of the long-range PCR amplified regions of the HLA genes [Figure <xref ref-type="fig" rid="F1">1</xref>, (<xref ref-type="bibr" rid="B33">33</xref>, <xref ref-type="bibr" rid="B34">34</xref>)]. Thus, the PacBio platform alone, or in combination with the short-read sequencers such as Ion Torrent and the Illumina platforms, is expected to determine the HLA allele sequences at the full-length level.</p>
<p>In this paper, we describe the generation of a comprehensive collection of full-length HLA allele reference sequences from eight classical HLA loci (HLA-A, HLA-B, HLA-C, HLA-DRB1, HLA-DQA1, HLA-DQB1, HLA-DPA1, and HLA-DPB1) using both the SMRT and the Ion Torrent sequencing technologies. We used 46 genomic DNA samples from the healthy subjects that include 137 high-frequent HLA alleles resolved to the field-2 level (an allele resolution level of sequences that differs by a non-synonymous substitution) in the Japanese population (&#x0003E;99.8% cumulative allele frequencies in each locus). Also, we compared the classified full-length HLA allele sequences at each locus from the perspective of nucleotide diversity of SNVs and insertions or deletions (indels) within the noncoding regions. As an example of future HLA-related disease and transplantation studies, we identified specific variations and previously &#x0201C;undetermined&#x0201D; sequence regions in the HLA-DRB1 locus of these Japanese reference samples that might be related to rheumatoid arthritis (RA).</p>
</sec>
<sec sec-type="materials and methods" id="s2">
<title>Materials and methods</title>
<sec>
<title>Genomic DNA samples previously genotyped for HLA polymorphisms to the field-2 level of allelic resolution</title>
<p>A total of 3,115 donors for bone marrow transplantation through the Japan Marrow Donor Program (JMDP) between 2006 and 2010 were retrospectively genotyped by the PCR-SSO-Luminex method for the HLA-A, HLA-B, HLA-C, HLA-DRB1, HLA-DQB1, HLA-DPB1 loci only up to the field-2 level of allelic variant designations as described elsewhere (<xref ref-type="bibr" rid="B35">35</xref>). Also, 400 healthy Japanese subjects collected at Tokai University were genotyped by PCR-SSO-Luminex method for the HLA-A, HLA-B, HLA-C, and HLA-DRB1 loci and by the PCR-SBT method for the HLA-DQB1 and HLA-DPB1 loci to the field-2 level (unpublished data). Based on the distribution of the HLA allele frequency data in the Japanese population (HLA laboratory: <ext-link ext-link-type="uri" xlink:href="http://www.hla.or.jp/haplo/haplonavi">http://www.hla.or.jp/haplo/haplonavi</ext-link>) (Table <xref ref-type="supplementary-material" rid="SM1">S1</xref>), a reference set of 46 DNA samples [22 from JMDP (JPN01 to JPN22) and 24 from Tokai University (JPN23 to JPN46)] were selected from the larger number of low-resolution genotyped samples. These Japanese reference samples represented more than 99.6% of the known HLA alleles at each HLA locus excluding HLA-DQA1 and HLA-DPA1 with 137 alleles in total (19 HLA-A, 38 HLA-B, 17 HLA-C, 31 HLA-DRB1, 15 HLA-DQB1, and 17 HLA-DPB1) (Table <xref ref-type="supplementary-material" rid="SM1">S1</xref>: blue background). The HLA genotyping results limited to the field-2 level of allelic resolution by the traditional HLA genotyping methods are shown in Table <xref ref-type="supplementary-material" rid="SM2">S2</xref>.</p>
</sec>
<sec>
<title>Long-range PCR</title>
<p>We used the previously designed HLA-A, HLA-B, HLA-C, HLA-DQA1, and HLA-DPA1 locus-specific primer sets that cover the whole gene regions from the promoter-enhancer region to 3&#x02032;UTR with the expected amplicon size of 5.5 kb for HLA-A, 4.6 kb for HLA-B, and 4.8 kb for HLA-C, 7.5 kb for HLA-DQA1, and 9.7 kb for HLA-DPA1 (<xref ref-type="bibr" rid="B24">24</xref>). For each of the HLA-DRB1, HLA-DQB1, and HLA-DPB1 loci the PCR regions were divided into two overlapping parts: 6.1&#x02013;11.2 kb for the enhancer-promoter to exon 2 (PCR amplicon name: DRB1-1) and 5.5&#x02013;6.7 kb for exon 2 to 3&#x02018;UTR (DRB1-2) in HLA-DRB1; 6.7 kb for the enhancer-promoter to exon 4 (DQB1-1) and 5.7 kb for intron 1&#x02013;3&#x02018;UTR (DQB1-2) in HLA-DQB1; and 5.9 kb for enhancer-promoter to intron 2 (DPB1-1) and 7.3 kb for intron 1&#x02013;3&#x02018;UTR (DPB1-2) in HLA-DPB1 (Figure <xref ref-type="supplementary-material" rid="SM8">S1</xref>). The PCR conditions were published previously (<xref ref-type="bibr" rid="B24">24</xref>). After amplification, the PCR amplicons were purified by the Agencourt AMPure XP (Beckman Coulter, Fullerton, CA) and quantified by the Quant-iT PicoGreen dsDNA Assay Kit (Invitrogen/Thermo Fisher Scientific, Carlsbad, CA) with a Fluoroskan Ascent Microplate Fluorometer (Thermo Fisher Scientific, Waltham, MA). We prepared the PCR amplicons separately for the PacBio and Ion PGM sequencing methods as described in the following sections.</p>
</sec>
<sec>
<title>Sequencing using the PacBio RS II sequencer</title>
<p>We partitioned the 11 long-range PCR amplicons from the eight HLA loci into three groups based on the expected length of the PCR amplicons and constructed three sets of pooled libraries. Pool-1 included HLA-A, -B, and -C (4.6&#x02013;5.5 kb) gene amplicons, pool-2 consisted of HLA-DRB1-2, -DQB1-1, -DQB1-2, and -DPB1-1 (5.5&#x02013;6.7 kb) and pool-3 included HLA-DRB1-1, -DQA1, -DPA1, and -DPB1-2 (6.1&#x02013;11.2 kb) (Figure <xref ref-type="supplementary-material" rid="SM8">S1</xref>). The quantity and size distribution of the PCR amplicons were measured using the Qubit Fluorometer (Life Technologies/Thermo Fisher Scientific, Palo Alto, CA) and Agilent 2100 Bioanalyzer DNA12000 kit (Agilent Technologies, Santa Clara, CA). The total amount of pooled amplicon DNA input into each library preparation ranged between 3 and 4 micrograms. Using the PacBio DNA Template Prep Kit 2.0 and SMRTbell Barcoded Adapter Complete Prep Kit (Pacific Biosciences, Menlo Park, CA), the pooled PCR amplicons were end-repaired, and blunt-end ligated to barcoded hairpin adapters to produce SMRTbell templates. A 0.45 &#x000D7; volume of AMPure PB beads was used to purify the barcoded SMRTbell libraries before sequencing. A binding calculator provided by PacBio determined the ratio of sequencing primer to template and polymerase to template and optimal loading concentration in the SMRT Cell. The SMRTbell templates were bound to P6 DNA polymerase. To remove excess polymerase and primer, the SMRTbell-polymerase complex was bound to MagBeads at 4&#x000B0;C for 20 min, using manufacturer&#x00027;s guidelines. The MagBeads-bound polymerase-template complexes were run in the PacBio RS II for sequencing. The most advanced sequencing chemistry (P6-C4) for the PacBio RSII Sequencing System, was used to generate long-read sequences spanning the complete lengths of the input long-range PCR amplicons. The most optimal movie collection time was employed to capture full-length reads. A 240-min movie was collected for the first pool (4.6&#x02013;5.5 kb), and 360 min movies were collected for the second (5.5&#x02013;6.7 kb), and third (6.1&#x02013;11.2 kb) libraries to produce maximum number of full-length reads. In total, six SMRT Cells were run for sequencing, two for each of the pooled libraries 1, 2, and 3. After sequencing, the analysis of the consensus sequences was done independently for each of the pooled libraries 1, 2, and 3. Clustering, phasing, consensus building, post-processing and evaluation of the consensus sequences were performed using the Long Amplicon Analysis (LAA) computing pipeline of the SMRT Analysis v2.3 program (<ext-link ext-link-type="uri" xlink:href="http://www.pacb.com/wp-content/uploads/guide-pacbio-HLA-getting-started.pdf">http://www.pacb.com/wp-content/uploads/guide-pacbio-HLA-getting-started.pdf</ext-link>). Sequencing data were first filtered to remove all subreads with predicted accuracy of &#x0003C;80%, lengths of &#x0003C;90% of the shortest amplicon in each pool, and a signal-to-noise ratio (SNR) of less than 4.0. For each pool, up to 5,000 of the remaining high-quality, full-length reads were used for the LAA analysis with default phasing parameters (maximum phasing reads &#x0003D; 500, minimum split fraction &#x0003D; 0.1).</p>
</sec>
<sec>
<title>Sequencing using the ion PGM sequencer</title>
<p>Barcoded-library DNA samples were prepared with an Ion Xpress Plus Fragment Library Kit and Ion Xpress barcode Adaptors 1&#x02013;96 Kit according to the manufacturer&#x00027;s protocol for 400 base-read sequencing (Life Technologies/Thermo Fisher Scientific). One hundred nanograms of the multiplex PCR amplicons were used for the preparation of each DNA barcoded-library. DNA samples were fragmented with an M220 Focused-ultrasonicator (Covaris, Woburn, MA). Eight cycles of PCR were used to amplify each DNA library. The DNA size and quantitation for each library were measured with an Agilent 2100 Expert Bioanalyzer using the Agilent High Sensitivity DNA Kit (Agilent Technologies). Each barcoded-library was mixed at equimolar concentrations then diluted according to the manufacturer&#x00027;s recommendation. Emulsion PCR (emPCR) was performed on the resulting pooled library with the Ion PGM Template OT2 400 Kit on an Ion OneTouch 2 automated system (Life Technologies/Thermo Fisher Scientific). After the emulsion was automatically broken with the OneTouch 2 instrument, the beads carrying the single-stranded DNA templates were enriched according to the manufacturer&#x00027;s recommendation. Sequencing was performed using the Ion PGM Sequencing 400 Kit and Ion 318 Chip Kit v2 with a flow number of 850 for a 400 base-read (<xref ref-type="bibr" rid="B36">36</xref>). The raw data processing and base-calling, trimming, and output of quality-filter sequence reads were binned by the Ion Xpress Barcodes into 46 separate sequence fastq files using the Torrent Suite 4.2.1 software (Life Technologies/Thermo Fisher Scientific) with full processing for shotgun analysis. These sequence data files were further quality trimmed to remove poor sequences at the end of the reads with Quality values (QVs) of &#x0003C;15. The trimmed and barcode-binned sequence reads were used for HLA allele assignment to the field-2 level using the in-house Sequence Alignment Based Assigning Software [SeaBass, Tokai University, (<xref ref-type="bibr" rid="B37">37</xref>)]. QVs of sequence reads were calculated by the fastx_quality_stats included with the FASTX-Toolkit for short-reads data preprocessing (<ext-link ext-link-type="uri" xlink:href="http://hannonlab.cshl.edu/fastx_toolkit/">http://hannonlab.cshl.edu/fastx_toolkit/</ext-link>).</p>
</sec>
<sec>
<title>Allele sequence determination of full-length reference sequences</title>
<p>We used two complementing sequencing technologies to characterize the HLA alleles; generally, the PGM short-read sequences for genotyping and the PacBio long-read consensus sequences to phase the HLA allele sequences. In order to obtain more accurate nucleotide sequences, short-read sequence outputs by Ion PGM sequencing were mapped to the long-read consensus sequences that were produced by PacBio RS II sequencing using the GS Reference Mapper Ver. 3.0 software (Roche, Basel, Switzerland). To avoid mismapping among the HLA loci and contamination of the <italic>in vitro</italic> generated PCR crossover amplicons (<xref ref-type="bibr" rid="B37">37</xref>, <xref ref-type="bibr" rid="B38">38</xref>), we first used the software mapping parameters that found perfect alignment matches between the read sequences and the reference sequences using the following settings: Minimum overlap identity: 100, Minimum read length: 45, Minimum overlap length: 200, Alignment identity score: 10, and Alignment difference score: 0. We confirmed high percent coverage of the references in the Profile window, and visually inspected the sequence alignments for nucleotide mismatches in the results window using the parameter setting called Open the Alignment. The long-read consensus sequences were considered to be correct when they and the short-read sequences aligned uniformly and correctly to the reference sequence. When there were unmapped nucleotide sites or mismatches in the sequence alignments, we realigned the short-read sequences to the long-read consensus sequences by changing the Minimum overlap identity parameter from 100 to 99. From the new alignment information obtained at a slightly lower stringency, we manually modified the long-read consensus sequences based on the information of direct matches between the short-read sequences and the previously unmodified consensus sequences. The modified long-read consensus sequences that remained doubtful were checked and confirmed by Sanger direct-sequencing.</p>
</sec>
<sec>
<title>Sanger sequencing using the ABI3130xl genetic analyzer</title>
<p>Purified PCR amplicons were sequenced bidirectionally, to validate newly discovered SNVs and indels with the Big Dye Terminator Kit v.1.1 (Life Technologies/Thermo Fisher Scientific) using the ABI3130xl genetic analyzer (Life Technologies/Thermo Fisher Scientific). The generated chromatogram sequence data were analyzed by the Sequencher ver.5.0.1 DNA sequence assembly software (GENCODE).</p>
</sec>
<sec>
<title>Nucleotide diversity analysis</title>
<p>Multiple sequence alignments for each locus were created using the Sequencher ver.5.0.1 DNA sequence assembly software (GENCODE). The diversity profile was calculated and drawn using the graphics output of the Microsoft Excel for Mac 2011. Repetitive elements including retroelements were identified within the HLA allele sequences by using the RepeatMasker webserver (<ext-link ext-link-type="uri" xlink:href="http://www.repeatmasker.org">http://www.repeatmasker.org</ext-link>).</p>
</sec>
<sec>
<title>Phylogenetic analysis</title>
<p>Multiple sequence alignments for each locus were created using the ClustalW Sequence Alignment program of the Molecular Evolution Genetics Analysis software 6 (MEGA6) (<xref ref-type="bibr" rid="B39">39</xref>). Phylogenetic trees were constructed by the Neighbor-joining (NJ) method with Maximum Composite Likelihood model and assessed using 10,000 bootstrap replicates in the MEGA6 software (<xref ref-type="bibr" rid="B40">40</xref>).</p>
</sec>
<sec>
<title>Allele assignments and nomenclature</title>
<p>The HLA alleles were assigned using HLA Fusion 3.0 Software (One Lambda/Life Technologies, Canoga Park CA) for the PCR-SSO-Luminex data, u-Type 7.1 software (One Lambda) for the SBT data, and Blat sequence alignment search for the downloaded IPD-IMGT/HLA alleles (Release 3.31.0) and for the PacBio and Ion PGM data. The IPD-IMGT/HLA database assigned the HLA allele official names following the nomenclature for factors of the HLA System using the four-fields of allelic resolution (allelic variants) based on the different levels of variation in the DNA sequences. (<xref ref-type="bibr" rid="B41">41</xref>). Field-1 is the allelic lineage or group that is shared by all allele variants in that group; field-2 defines a DNA variation that leads to an amino acid difference (non-synonymous DNA substitution) in the allele group defined by field-1; field-3 indicates the synonymous DNA substitution in the coding region of the allelic group; and field-4 refers to differences in the non-coding regions of the allelic group. (<xref ref-type="bibr" rid="B42">42</xref>). HLA exonic sequencing is limited to the field-3 level of allelic resolution, whereas HLA genomic coding and non-coding sequencing extends the allelic resolution up to the field-4 level. However, a unique allele with no variants that has been completely sequenced at the genomic field-4 level is usually given only a two-field name (such as B<sup>&#x0002A;</sup>15:428), and although somewhat confusing, we have retained this practice here.</p>
</sec>
</sec>
<sec sec-type="results" id="s3">
<title>Results</title>
<sec>
<title>Characteristics of draft-reads for PacBio RS II and ion PGM sequencing</title>
<p>Raw subread information of draft-reads obtained for 46 genomic DNA samples after sequencing the 11 long-range PCR amplicons by the PacBio RS II sequencer is shown in Table <xref ref-type="supplementary-material" rid="SM3">S3</xref> and includes SMRT Cell numbers, P1 and P2 values that mean the rates of productive ZMW and other ZMW in SMRT cells, respectively, the minimum, mean, and maximum subread numbers and mean quality values per sample for each primer set. The mean P1-values ranged from 36.7 to 46.1% and the mean P2-values ranged from 6.7 to 10.1%. The highest and lowest mean numbers were observed for the DQB1-1&#x0002B;DQB1-2 primer sets (1,319 subreads ranging from 567 to 2,071) and the DPA1 primer set (63 subreads ranging from 44 to 82), respectively. Less than one hundred minimum subreads were obtained in pool-3 that included long-range PCR amplicons of 6.1&#x02013;11.2 kb, whereas over one hundred minimum subreads were obtained in pool-1 and pool-2 that included comparatively shorter PCR amplicons of 4.6&#x02013;6.7 kb. No subreads were obtained for allele 2 of the DPA1 gene in JPN29. In total, 692 consensus sequences were generated from the subreads using the LAA pipeline in preparation for constructing and mapping the full-length HLA allele sequences using the consensus sequences.</p>
<p>A summary of the number of draft-read bases obtained from 46 genomic DNA samples after sequencing individual HLA loci using the Ion PGM sequencer is presented in Table <xref ref-type="supplementary-material" rid="SM4">S4</xref>. Draft-read numbers were high-quality reads, and in total there was 15,016,797 sequence reads from two runs with read numbers ranging from 106,840 in JPN10 to 707,242 in JPN33 [326,452.1 &#x000B1; 141,566.9 standard deviation (SD) on average]. The average quality score and SD were 27.0 &#x000B1; 0.6. The draft-read bases in total were 3.8 Gb with a range between 23.1 Mb in JPN10 and 159.1 Mb in JPN33 (83.2 &#x000B1; 35.3 Mb on average), with an overall average, read length of 255.9 &#x000B1; 12.8 bases.</p>
</sec>
<sec>
<title>Comparison between the PacBio and ion PGM data for coding sequences</title>
<p>From a nucleotide similarity search of short-read sequences by Ion PGM sequencing 44 homozygous genotypes were identified from a total of 368 genotyped (46 samples &#x000D7; 8 loci) coding sequences (CDSs) (Table <xref ref-type="supplementary-material" rid="SM5">S5</xref>). Allele dropouts were not included in the analyses of these HLA-A, -B, -C, -DRB1, -DQB1, and -DPB1 sequences because the genotypes were consistent with the results of PCR-SSO and SBT (Table <xref ref-type="supplementary-material" rid="SM1">S1</xref>). However, it is possible that there was allele dropout in the homozygous genotypes of HLA-DPA1 and -DQA1. The five alleles represented by the HLA-B genes of JPN34 and JPN36, and HLA-DPA1 of JPN04, JPN25, and JPN37 showed 99.9 and 99.4% nucleotide similarity to the most similar previously documented alleles, respectively, while the other alleles were perfectly matched to known sequences. All typing data were identical with the retrospectively genotyped data (Table <xref ref-type="supplementary-material" rid="SM2">S2</xref>), excluding a single discrepancy for HLA-C<sup>&#x0002A;</sup>08:01 in JPN04 and HLA-C<sup>&#x0002A;</sup>08:22 in JPN30 due to an SNV that separated the alleles in exon 6.</p>
<p>The PacBio consensus sequences were used as reference sequences for mapping the short-read sequence outputs by Ion PGM sequencing. Although the output from the PacBio RS II sequencing identified 44 homozygous genotypes, the comparison of the nucleotide similarities between both sets of sequencing data revealed artifactual dropouts for four alleles, HLA-B of JPN04, HLA-DQA1 of JPN10, and HLA-DPA1 of JPN29, and a mismatch for one allele of HLA-DQB1 of JPN20 (Table <xref ref-type="supplementary-material" rid="SM5">S5</xref>). DNA typing of these samples by the PCR-SSO-Luminex and PCR-SBT methods confirmed that these were dropouts in the PacBio data. The four dropout allele sequences were determined by comparing the most similar allele sequences within the reference sequence group against those that were determined in other samples using the Ion PGM reads.</p>
</sec>
<sec>
<title>Characterization and allele assignment of the full-length, polymorphic class I and class II HLA sequences to establish a population reference group</title>
<p>A total of 253 HLA allele sequences (20 HLA-A, 46 HLA-B, 26 HLA-C, 41 HLA-DRB1, 36 HLA-DQA1, 28 HLA-DQB1, 16 HLA-DPA1, and 40 HLA-DPB1) that covered the promoter-enhancer region, the intronic and exonic regions and across to 3&#x02032;UTR were determined for the 46 Japanese samples by the PacBio, Ion PGM, and Sanger sequencing. Table <xref ref-type="supplementary-material" rid="SM6">S6</xref> shows the genomic allele designation of the full-length HLA alleles (coding and non-coding sequences) up to the field-4 level for some variants for each sample and locus. Table <xref ref-type="supplementary-material" rid="SM7">S7</xref> shows the allele names, DNA data bank of Japan (DDBJ) accession numbers, IMGT submission numbers, nucleotide length of each allele, novel or extended alleles, the location of variations, and the number of detected alleles.</p>
<p>The two alleles B<sup>&#x0002A;</sup>40:01:02:01/04 and DQB1<sup>&#x0002A;</sup>03:03:02:02/03 were classified as ambiguous because some nucleotide variations previously used to assign these alleles were located outside the region of our two sequences. Of the 736 alleles, 181 alleles (24.6%) were novel, and 23.9% (176/736) of them had variations within introns or in the 5&#x02032; and 3&#x02032; non-coding regions. Also, 193 alleles were extended from an exonic or partial gene sequence to a full-gene sequence, and 50.8% of the 736 alleles were reassigned in the IPD-IMGT/HLA database as novel allele sequences. Also, 89.6% of the HLA-DRB1 allele sequences are unique or extended alleles (Table <xref ref-type="table" rid="T1">1</xref> and Table <xref ref-type="supplementary-material" rid="SM7">S7</xref>). Of the 101 novel alleles, four had variants in the exonic regions, and of them, B<sup>&#x0002A;</sup>15:428, DPA1<sup>&#x0002A;</sup>02:07:01:01, and DPA1<sup>&#x0002A;</sup>02:08 had non-synonymous substitutions (Table <xref ref-type="table" rid="T2">2</xref>). The five alleles (HLA-B of JPN34 and JPN36 and HLA-DPA1 of JPN04, JPN25, and JPN37) that showed 99.9 or 99.4% nucleotide similarities in the CDS search were also classified as novel alleles (Table <xref ref-type="supplementary-material" rid="SM5">S5</xref>). Of the 44 genotypes that initially were classified as homozygous within the coding regions, seven of them were revealed as heterozygotes within the intronic region (Table <xref ref-type="supplementary-material" rid="SM5">S5</xref>).</p>
<table-wrap position="float" id="T1">
<label>Table 1</label>
<caption><p>Characterization of 253 distinct full-length HLA alleles.</p></caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th valign="top" align="left"><bold>Locus</bold></th>
<th valign="top" align="center"><bold>Distinct sequences</bold></th>
<th valign="top" align="center"><bold>Total sequences</bold></th>
<th valign="top" align="center" colspan="3"><bold>Detected novel allele number</bold></th>
<th valign="top" align="center"><bold>Novel alleles/all alleles</bold></th>
<th valign="top" align="center"><bold>Detected extended allele number</bold></th>
<th valign="top" align="center"><bold>Novel &#x0002B; extended alleles/all alleles</bold></th>
</tr>
<tr>
<th/>
<th/>
<th/>
<th valign="top" align="center"><bold>Coding region</bold></th>
<th valign="top" align="center"><bold>Intronic region</bold></th>
<th valign="top" align="center"><bold>5&#x02032;/3&#x02032;Non-coding region</bold></th>
<th/>
<th/>
<th/>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">A</td>
<td valign="top" align="center">20</td>
<td valign="top" align="center">92</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">1.1%</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">3.3%</td>
</tr>
<tr>
<td valign="top" align="left">B</td>
<td valign="top" align="center">46</td>
<td valign="top" align="center">92</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">5</td>
<td valign="top" align="center">7</td>
<td valign="top" align="center">15.2%</td>
<td valign="top" align="center">8</td>
<td valign="top" align="center">23.9%</td>
</tr>
<tr>
<td valign="top" align="left">C</td>
<td valign="top" align="center">26</td>
<td valign="top" align="center">92</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">9</td>
<td valign="top" align="center">12.0%</td>
<td valign="top" align="center">29</td>
<td valign="top" align="center">43.5%</td>
</tr>
<tr>
<td valign="top" align="left">DRB1</td>
<td valign="top" align="center">41</td>
<td valign="top" align="center">92</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">45</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">48.9%</td>
<td valign="top" align="center">37</td>
<td valign="top" align="center">89.1%</td>
</tr>
<tr>
<td valign="top" align="left">DQA1</td>
<td valign="top" align="center">36</td>
<td valign="top" align="center">92</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">28</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">31.5%</td>
<td valign="top" align="center">21</td>
<td valign="top" align="center">54.3%</td>
</tr>
<tr>
<td valign="top" align="left">DQB1</td>
<td valign="top" align="center">28</td>
<td valign="top" align="center">92</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">32</td>
<td valign="top" align="center">5</td>
<td valign="top" align="center">40.2%</td>
<td valign="top" align="center">5</td>
<td valign="top" align="center">45.7%</td>
</tr>
<tr>
<td valign="top" align="left">DPA1</td>
<td valign="top" align="center">16</td>
<td valign="top" align="center">92</td>
<td valign="top" align="center">3</td>
<td valign="top" align="center">10</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">15.2%</td>
<td valign="top" align="center">69</td>
<td valign="top" align="center">90.2%</td>
</tr>
<tr>
<td valign="top" align="left">DPB1</td>
<td valign="top" align="center">40</td>
<td valign="top" align="center">92</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">30</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">32.6%</td>
<td valign="top" align="center">22</td>
<td valign="top" align="center">56.5%</td>
</tr>
<tr style="border-top: thin solid #000000;">
<td valign="top" align="left">Total</td>
<td valign="top" align="center">253</td>
<td valign="top" align="center">736</td>
<td valign="top" align="center">5</td>
<td valign="top" align="center">153</td>
<td valign="top" align="center">23</td>
<td valign="top" align="center">24.6%</td>
<td valign="top" align="center">193</td>
<td valign="top" align="center">50.8%</td>
</tr>
</tbody>
</table>
</table-wrap>
<table-wrap position="float" id="T2">
<label>Table 2</label>
<caption><p>Identification and classification of novel variants in exonic regions.</p></caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th valign="top" align="left"><bold>Sample ID</bold></th>
<th valign="top" align="left"><bold>JPN34</bold></th>
<th valign="top" align="left"><bold>JPN36</bold></th>
<th valign="top" align="center" colspan="3"><bold>JPN04, JPN25</bold></th>
<th valign="top" align="left"><bold>JPN37</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Locus</td>
<td valign="top" align="left">HLA-B</td>
<td valign="top" align="left">HLA-B</td>
<td valign="top" align="center" colspan="3">HLA-DPA1</td>
<td valign="top" align="left">HLA-DPA1</td>
</tr>
<tr>
<td valign="top" align="left">Novel allele name</td>
<td valign="top" align="left">B&#x0002A;15:428</td>
<td valign="top" align="left">B&#x0002A;39:02:03</td>
<td valign="top" align="center" colspan="3">DPA1&#x0002A;02:07:01:01</td>
<td valign="top" align="left">DPA1&#x0002A;02:08</td>
</tr>
<tr>
<td valign="top" align="left">Reference</td>
<td valign="top" align="left">B&#x0002A;15:28</td>
<td valign="top" align="left">B&#x0002A;39:02:02</td>
<td valign="top" align="center" colspan="3">DPA1&#x0002A;02:02:01</td>
<td valign="top" align="left">DPA1&#x0002A;02:01:01:02</td>
</tr>
<tr>
<td valign="top" align="left">IMGT num. of reference</td>
<td valign="top" align="left">HLA00191</td>
<td valign="top" align="left">HLA00275</td>
<td valign="top" align="center" colspan="3">HLA00508</td>
<td valign="top" align="left">HLA14197</td>
</tr>
<tr>
<td valign="top" align="left">Reference position</td>
<td valign="top" align="left">25</td>
<td valign="top" align="left">1,008</td>
<td valign="top" align="left">251</td>
<td valign="top" align="left">361</td>
<td valign="top" align="left">442</td>
<td valign="top" align="left">4893</td>
</tr>
<tr>
<td valign="top" align="left">Location</td>
<td valign="top" align="left">Exon 1</td>
<td valign="top" align="left">Exon 5</td>
<td valign="top" align="left">Exon 3</td>
<td valign="top" align="left">Exon 3</td>
<td valign="top" align="left">Exon 3</td>
<td valign="top" align="left">Exon 4</td>
</tr>
<tr>
<td valign="top" align="left">Nucleotide Reference</td>
<td valign="top" align="left">G</td>
<td valign="top" align="left">C</td>
<td valign="top" align="left">G</td>
<td valign="top" align="left">A</td>
<td valign="top" align="left">A</td>
<td valign="top" align="left">G</td>
</tr>
<tr>
<td valign="top" align="left">Nucleotide Variant</td>
<td valign="top" align="left">C</td>
<td valign="top" align="left">T</td>
<td valign="top" align="left">A</td>
<td valign="top" align="left">G</td>
<td valign="top" align="left">G</td>
<td valign="top" align="left">A</td>
</tr>
<tr>
<td valign="top" align="left">Amino acid substitution</td>
<td valign="top" align="left">V9L</td>
<td valign="top" align="left">-</td>
<td valign="top" align="left">V122M</td>
<td valign="top" align="left">-</td>
<td valign="top" align="left">-</td>
<td valign="top" align="left">R249H</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p><italic>A hyphen indicates synonymous substitution</italic>.</p>
</table-wrap-foot>
</table-wrap>
</sec>
<sec>
<title>Nucleotide diversity and phylogenetic analyses of HLA allele sequences</title>
<p>To calculate and map the nucleotide diversities for each HLA locus we constructed multiple sequence alignments and nucleotide diversity profiles at the locus level using all of the allele sequences identified in this study (Figure <xref ref-type="supplementary-material" rid="SM9">S2</xref>). The indel numbers and SNV rates (SNV/Kb: number of SNVs/alignment length excluding indels/allele numbers &#x000D7; 1000) in the class I loci (HLA-A, HLA-B, and HLA-C) showed comparatively low rates with 11&#x02013;13 numbers for indels and 1.4&#x02013;3.1 SNV/Kb (Table <xref ref-type="table" rid="T3">3</xref>). The indels were dispersed mainly within the intronic regions, whereas highest SNV/Kb were observed in the exonic regions such as exons 2 and 3 in HLA-A and HLA-B and across all the exons in HLA-C (Figures <xref ref-type="supplementary-material" rid="SM9">S2A</xref>&#x02013;<xref ref-type="supplementary-material" rid="SM9">C</xref>). In comparison to the class I loci, the class II loci showed a higher level of locus-specific indels with 22&#x02013;144 numbers and a moderately high level of SNV rates with 2.2&#x02013;5.3/Kb at the allele level (Table <xref ref-type="table" rid="T3">3</xref>).</p>
<table-wrap position="float" id="T3">
<label>Table 3</label>
<caption><p>The number of indels and SNVs among the alleles at each HLA locus.</p></caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th valign="top" align="left"><bold>Locus</bold></th>
<th valign="top" align="center"><bold>Allele number to the full-length level</bold></th>
<th valign="top" align="center" style="border-bottom: thin solid #000000;" colspan="2"><bold>Including indels</bold></th>
<th valign="top" align="center" style="border-bottom: thin solid #000000;" colspan="2"><bold>Excluding indels</bold></th>
<th valign="top" align="center"><bold>SNV/Kb</bold></th>
</tr>
<tr>
<th/>
<th/>
<th valign="top" align="center"><bold>Alignment length (bp)</bold></th>
<th valign="top" align="center"><bold>Number of indels</bold></th>
<th valign="top" align="center"><bold>Alignment length (bp)</bold></th>
<th valign="top" align="center"><bold>Number of SNVs</bold></th>
<th/>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">A</td>
<td valign="top" align="center">20</td>
<td valign="top" align="center">5,436</td>
<td valign="top" align="center">13</td>
<td valign="top" align="center">5,396</td>
<td valign="top" align="center">336</td>
<td valign="top" align="center">3.1</td>
</tr>
<tr>
<td valign="top" align="left">B</td>
<td valign="top" align="center">46</td>
<td valign="top" align="center">4,575</td>
<td valign="top" align="center">11</td>
<td valign="top" align="center">4,541</td>
<td valign="top" align="center">285</td>
<td valign="top" align="center">1.4</td>
</tr>
<tr>
<td valign="top" align="left">C</td>
<td valign="top" align="center">26</td>
<td valign="top" align="center">4,760</td>
<td valign="top" align="center">12</td>
<td valign="top" align="center">4,733</td>
<td valign="top" align="center">246</td>
<td valign="top" align="center">2.0</td>
</tr>
<tr style="border-top: thin solid #000000;">
<td valign="top" align="left">DRB1</td>
<td valign="top" align="center">41</td>
<td valign="top" align="center">18,740</td>
<td valign="top" align="center">144</td>
<td valign="top" align="center">10,262</td>
<td valign="top" align="center">1,727</td>
<td valign="top" align="center">2.2</td>
</tr>
<tr>
<td valign="top" align="left">DQA1</td>
<td valign="top" align="center">36</td>
<td valign="top" align="center">7,801</td>
<td valign="top" align="center">77</td>
<td valign="top" align="center">7,240</td>
<td valign="top" align="center">957</td>
<td valign="top" align="center">3.4</td>
</tr>
<tr>
<td valign="top" align="left">DQB1</td>
<td valign="top" align="center">28</td>
<td valign="top" align="center">8,393</td>
<td valign="top" align="center">107</td>
<td valign="top" align="center">7,551</td>
<td valign="top" align="center">1,247</td>
<td valign="top" align="center">5.3</td>
</tr>
<tr>
<td valign="top" align="left">DPA1</td>
<td valign="top" align="center">16</td>
<td valign="top" align="center">9,766</td>
<td valign="top" align="center">28</td>
<td valign="top" align="center">9,662</td>
<td valign="top" align="center">348</td>
<td valign="top" align="center">2.2</td>
</tr>
<tr>
<td valign="top" align="left">DPB1</td>
<td valign="top" align="center">40</td>
<td valign="top" align="center">12,306</td>
<td valign="top" align="center">22</td>
<td valign="top" align="center">12,147</td>
<td valign="top" align="center">343</td>
<td valign="top" align="center">0.7</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>Indels of over 500 bp were observed in introns 1, 2, and 5, and many of them explicitly correlated with the DR supratypes. Most of the indels were composed of repetitive elements such as short interspersed nuclear element (SINE) and long interspersed nuclear element (LINE) sequences located in position 5,264&#x02013;10,528 bp of intron 1, position 2,214&#x02013;3,464 bp of intron 2 and position 627&#x02013;1,142 bp of intron 5 (Figure <xref ref-type="fig" rid="F2">2</xref> and Figure <xref ref-type="supplementary-material" rid="SM9">S2D</xref>). This result of the correlation between structurally polymorphic retrotransposons and the HLA-DR supratypes DR1, DR8, DR51, DR52, and DR53 supports and extends the previous findings (<xref ref-type="bibr" rid="B43">43</xref>, <xref ref-type="bibr" rid="B44">44</xref>). The relationships of the DR supratypes and the indels also were strongly supported by a phylogenetic tree that was constructed using selected intronic 1, 2, and 5 sequences (Figure <xref ref-type="fig" rid="F2">2</xref>). Also, the transcription factor binding motifs such as X1, X2, Y, CCAAT, and TATA boxes (<xref ref-type="bibr" rid="B45">45</xref>) appear to have evolved according to the lineages of the DR-types (data not shown). The highest SNV/Kb were observed mostly around the exon 2 and intron 5 regions.</p>
<fig id="F2" position="float">
<label>Figure 2</label>
<caption><p>Gene structure, DR supratypes and phylogenetic relationships using the HLA-DRB1 allele sequences. Three of the DR supratypes are labeled DR53, DR51, and DR52, and their component alleles are listed underneath the horizontal lines. The phylogenetic tree of the HLA-DRB1 alleles ranging from DRB1<sup>&#x0002A;</sup>07 to the left of the figure and DRB1<sup>&#x0002A;</sup>03 to the right of the figure was constructed using the Neighbor-Joining method and a 1,962 bp nucleotide alignment that included 261 bp of AluJb, 492 bp of L2a, 281 bp of AluSc8, 655 bp of L2a, and 65 bp of MER53 in intron 1, and 145 bp of MIR in intron 2 and 63 bp of MIR in intron 5. Numbers on the branches are bootstrap support values. Red letters indicate Alu and LINE sequences that may have been inserted in the comparatively recent period during the last 10 million years. Gray bars indicate the exonic regions and the white open regions with the retroelement lists between the gray bars represent introns 1 to 5 in between exons 1 and 6.</p></caption>
<graphic xlink:href="fimmu-09-02294-g0002.tif"/>
</fig>
<p>In regard to the nucleotide diversity within the other class II genes, the indel numbers were 77 and 107 for the HLA-DQA1 and HLA-DQB1 loci, respectively, and significant indels were observed in the introns 2 and 3 of HLA-DQA1 and intron 2 of HLA-DQB1 (Figures <xref ref-type="supplementary-material" rid="SM9">S2E,F</xref>). The SNV/Kb was 3.4 and 5.3 for HLA-DQA1 and HLA-DQB1, respectively, which was similar for the HLA-DRB1 locus (Table <xref ref-type="table" rid="T3">3</xref>). The highest SNV/Kb were observed around the 5&#x02032;UTR, exon 2 and exon 5 regions in HLA-DQA1 and around exon 2 within HLA-DQB1. The HLA-DPA1 and HLA-DPB1 loci were well conserved among the class II genes with 28 and 22 indel numbers and 2.2 and 0.7 SNV/Kb, respectively (Table <xref ref-type="table" rid="T3">3</xref>). The 250 bp up-stream regions of the loci that include the transcription factor binding motifs were perfectly conserved among the alleles, although allelic variations in the transcription factor binding motifs were observed within some of the other HLA loci (data not shown).</p>
<p>The HLA-DPA1 and HLA-DPB1 allele sequences were separated into two distinct divergent groups, the DP2 and DP5 (<xref ref-type="bibr" rid="B46">46</xref>). The nucleotide diversity profiles of the HLA-DPA1 (Figure <xref ref-type="supplementary-material" rid="SM9">S2G</xref>) and HLA-DPB1 (Figure <xref ref-type="fig" rid="F3">3A1</xref>) showed unusually low diversity patterns when compared to the other HLA class II loci (Table <xref ref-type="table" rid="T3">3</xref> and Figures <xref ref-type="supplementary-material" rid="SM9">S2D</xref>&#x02013;<xref ref-type="supplementary-material" rid="SM9">F</xref>). Although the diversity patterns of the different HLA class II loci revealed the presence of a high SNV/Kb throughout the gene regions (2.2&#x02013;5.3/Kb) and high SNV densities in the polymorphic exons (Figures <xref ref-type="supplementary-material" rid="SM9">S2D</xref>&#x02013;<xref ref-type="supplementary-material" rid="SM9">F</xref>), the HLA-DPB1 nucleotide diversity profiles of the DP2 and DP5 groups included SNV/Kb of 0.3 for the 5.5 kb region between the promoter-enhancer and exon 2 (Segment 1) and 1.0 for the 6.6 kb region between intron 2 and the 3&#x02032;UTR (Segment 2) (Figure <xref ref-type="fig" rid="F3">3A1</xref>).</p>
<fig id="F3" position="float">
<label>Figure 3</label>
<caption><p>Nucleotide diversity and phylogenetic analyses using the HLA-DPB1 allele sequences. <bold>(A)</bold> Nucleotide diversity profiles were constructed using three nucleotide alignments, 12,306 bp (whole gene region), 5,551 bp (segment 1), and 6,755 bp (segment 2). The nucleotide lengths (bp) are shown with indels (no parenthesis) and without indels (in parenthesis). The A1, A2, and A3 matrix windows show the diversity profiles using 38 HLA-DPB1 alleles (18 DP2 group alleles and 20 DP5 group alleles), except for two recombinant alleles, DPB1<sup>&#x0002A;</sup>17:01:01:01 and DPB1<sup>&#x0002A;</sup>19:01:01:01. The red peak and valley profiles within the matrix windows indicate the changes in SNV/Kb across the aligned sequences and the black bars indicate indel numbers among the alleles. The average SNV/Kb for the sequence alignment is shown on the top line of each matrix window. <bold>(B)</bold> Phylogenetic trees using the 19 representative HLA-DPB1 alleles were constructed by the Neighbor-Joining method. The three phylogenetic trees (B1&#x02013;B3) represent the 12,147 bp nucleotide alignment of HLA-DPB1 whole gene region (B1), the 5,542 bp nucleotide alignment of the enhancer-promoter region to exon 2 (B2), and the 6,605 bp nucleotide alignment of the intron 2&#x02013;3&#x02032;UTR region (B3). Red letters and backgrounds indicate the DP2 group (rs9277534: A) and blue letters and backgrounds indicate the DP5 group (rs9277534: G) alleles. Numbers on the branches are bootstrap support values.</p></caption>
<graphic xlink:href="fimmu-09-02294-g0003.tif"/>
</fig>
<p>The HLA-DPB1 variation at rs9277534 has been associated with HLA-DPB1 expression levels, whereby high expression was associated with rs9277534G and low expression was associated with rs9277534A (<xref ref-type="bibr" rid="B20">20</xref>). Because the rs9277534 site was located in the 3&#x02032;UTR region of our HLA-DPB1 allele sequences, we grouped the rs9277534G with DP5 and rs9277534A with DP2, excluding two recombinant alleles, DPB1<sup>&#x0002A;</sup>17:01:01:01 and DPB1<sup>&#x0002A;</sup>19:01:01:01. By comparing various allelic sequences, we deduced that DPB1<sup>&#x0002A;</sup>17:01:01:01 in the DP2 group and DPB1<sup>&#x0002A;</sup>19:01:01:01 in the DP5 group were generated by recombination events in intron 2 of the DPB1<sup>&#x0002A;</sup>02:01:02:01 and DPB1<sup>&#x0002A;</sup>05:01:01:01 alleles (Figure <xref ref-type="supplementary-material" rid="SM10">S3</xref>).</p>
<p>We also compared the nucleotide diversity of the DP2 against DP5 and found that the SNV/Kb were markedly reduced in both the DP2 and DP5 groups with 0.4 and 0.5 in segment 1 and 0.04 and 0.3 in the segment 2, respectively (Figures <xref ref-type="fig" rid="F3">3A2,A3</xref>). The SNV/Kb in both of these segments were lower than those for all the alleles across the whole gene region (Figure <xref ref-type="fig" rid="F3">3A1</xref>). However, relatively high diversity was maintained within exon 2 of both DP groups, and the polymorphisms of exon 2 appear to have evolved independently of the DP2 and DP5 structures. This hypothesis is supported by the phylogenetic analyses of the HLA-DPB1 allele sequences (Figure <xref ref-type="fig" rid="F3">3B</xref>), whereby the trees for Segments 1 and 2 (Figures <xref ref-type="fig" rid="F3">3B2,B3</xref>) showed similar phylogenies, excluding the recombinant alleles, and that the tree for Segment 2 (Figure <xref ref-type="fig" rid="F3">3B3</xref>) clearly separated into the DP2 and DP5 groups. However, most of the branches of Segment 1 are longer than those of Segment 2, which is consistent with the view that most of the polymorphisms or variations were generated in Segment 1.</p>
</sec>
<sec>
<title>Identification of novel SNVs and sequence region variations in DRB1<sup>&#x0002A;</sup>04 allele sequences previously associated with rheumatoid arthritis (RA)</title>
<p>We extended the sequences for four DRB1<sup>&#x0002A;</sup>04 alleles and identified novel intronic variants for five DRB1<sup>&#x0002A;</sup>04 alleles (Table <xref ref-type="supplementary-material" rid="SM7">S7</xref>) that could be separated into three rheumatoid arthritis (RA) categories based on the previous results of a case-control study using 1480 patients and 800 healthy controls in the Japanese population (<xref ref-type="bibr" rid="B47">47</xref>). All together, these were RA-susceptible alleles for DRB1<sup>&#x0002A;</sup>04:01:01:03, DRB1<sup>&#x0002A;</sup>04:05:01:01, DRB1<sup>&#x0002A;</sup>04:05:01:02, DRB1<sup>&#x0002A;</sup>04:05:01:03, and DRB1<sup>&#x0002A;</sup>04:10:03, RA-resistant alleles for DRB1<sup>&#x0002A;</sup>04:03:01:02, DRB1<sup>&#x0002A;</sup>04:06:01, and DRB1<sup>&#x0002A;</sup>04:07:01:02, and a RA-non-associated allele for DRB1<sup>&#x0002A;</sup>04:04:01. Although it has been previously shown that amino acid 74 in exon 2 (nucleotide position 8,563) correlates well with RA susceptibility, the extended intronic sequence information enabled us to identify in addition two positions in intron 2 correlating with RA susceptibility as well at nucleotide positions 9,139 and 9,304 of the sequence alignments using the DRB1<sup>&#x0002A;</sup>04 group sequences in the IPD-IMGT/HLA database after repeat sequence masking (Figure <xref ref-type="supplementary-material" rid="SM11">S4</xref> in <xref ref-type="supplementary-material" rid="SM8">Supplementary Material</xref>). The &#x0201C;A&#x0201D; allele at the position 9,304 was observed in the RA-susceptible alleles (DRB1<sup>&#x0002A;</sup>04:01:01:03, DRB1<sup>&#x0002A;</sup>04:05:01:01, DRB1<sup>&#x0002A;</sup>04:05:01:02, DRB1<sup>&#x0002A;</sup>04:05:01:03, and DRB1<sup>&#x0002A;</sup>04:10:03). The &#x0201C;G&#x0201D; allele was observed in the RA-resistant alleles (DRB1<sup>&#x0002A;</sup>04:03:01:02, DRB1<sup>&#x0002A;</sup>04:06:01, and DRB1<sup>&#x0002A;</sup>04:07:01:02). Interestingly, a deletion of two bases was observed in the other 32 HLA-DRB1 alleles. In addition, a microRNA (hsa-miR-7156-5p) was predicted to bind to the RA resistant allele sequences at the position 9,304, but not to the other allele sequences when we examined the miRbase (<ext-link ext-link-type="uri" xlink:href="http://www.mirbase.org">http://www.mirbase.org</ext-link>) using a microRNA target prediction software (Figure <xref ref-type="supplementary-material" rid="SM11">S4</xref>). In contrast to the allele at the position 9,304, the &#x0201C;A&#x0201D; allele at position 9,139 was observed in the RA-resistant alleles (DRB1<sup>&#x0002A;</sup>04:03:01:02, DRB1<sup>&#x0002A;</sup>04:06:01, and DRB1<sup>&#x0002A;</sup>04:07:01:02) and RA-non-association allele (DRB1<sup>&#x0002A;</sup>04:04:01), whereas the &#x0201C;G&#x0201D; allele was observed in the other 37 HLA-DRB1 alleles including the RA-susceptible alleles (Table <xref ref-type="table" rid="T4">4</xref>). Furthermore, Table <xref ref-type="table" rid="T4">4</xref> shows that while the presence of the polymorphic AluYK2 and L1PA4 retroelements (Figure <xref ref-type="fig" rid="F2">2</xref>) correlated with all the DRB1<sup>&#x0002A;</sup>04, the SNV at 9,139 and 9,304 differentiated between resistant and susceptible RA forms.</p>
<table-wrap position="float" id="T4">
<label>Table 4</label>
<caption><p>Comparison of rheumatoid arthritis (RA)-susceptible, resistant and non-association alleles in the DRB1&#x0002A;04 group sequences.</p></caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th valign="top" align="left" style="border-bottom: thin solid #000000;" colspan="3"><bold>Statistical information of Oka et al. [</bold><xref ref-type="bibr" rid="B47"><bold>47</bold></xref><bold>]</bold></th>
<th valign="top" align="center"><bold>Allele name at the full-length level</bold></th>
<th valign="top" align="center" style="border-bottom: thin solid #000000;" colspan="8"><bold>Amino acid position in exon 2</bold></th>
<th valign="top" align="center" style="border-bottom: thin solid #000000;" colspan="2"><bold>Nucleotide position in intron 2</bold></th>
<th valign="top" align="center"><bold>Presence of AluYk2 in intron 1</bold></th>
<th valign="top" align="center"><bold>Presence of L1PA4 in intron 1</bold></th>
</tr>
<tr>
<th valign="top" align="left"><bold>Allele name</bold></th>
<th valign="top" align="center"><bold><italic>P</italic>-value</bold></th>
<th valign="top" align="center"><bold>OR (95% CI)</bold></th>
<th/>
<th valign="top" align="center"><bold>67</bold></th>
<th valign="top" align="center"><bold>68</bold></th>
<th valign="top" align="center"><bold>69</bold></th>
<th valign="top" align="center"><bold>70</bold></th>
<th valign="top" align="center"><bold>71</bold></th>
<th valign="top" align="center"><bold>72</bold></th>
<th valign="top" align="center"><bold>73</bold></th>
<th valign="top" align="center"><bold>74</bold></th>
<th valign="top" align="center"><bold>9139</bold></th>
<th valign="top" align="center"><bold>9304</bold></th>
<th/>
<th/>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">DRB1&#x0002A;04:05</td>
<td valign="top" align="center">1.4 &#x000D7;<break/> 10e-36</td>
<td valign="top" align="center">3.3<break/> (2.73&#x02013;4.01)</td>
<td valign="top" align="center" style="color:#ee1c23">DRB1&#x0002A;04:05:01:01</td>
<td valign="top" align="center">L</td>
<td valign="top" align="center">L</td>
<td valign="top" align="center">E</td>
<td valign="top" align="center">Q</td>
<td valign="top" align="center">R</td>
<td valign="top" align="center">R</td>
<td valign="top" align="center">A</td>
<td valign="top" align="center"><bold>A</bold></td>
<td valign="top" align="center"><bold>G</bold></td>
<td valign="top" align="center"><bold>A</bold></td>
<td valign="top" align="center">(&#x0002B;)</td>
<td valign="top" align="center">(&#x0002B;)</td>
</tr>
<tr>
<td/>
<td/>
<td/>
<td valign="top" align="center" style="color:#ee1c23">DRB1&#x0002A;04:05:01:02</td>
<td/>
<td/>
<td/>
<td/>
<td/>
<td/>
<td/>
<td/>
<td/>
<td/>
<td valign="top" align="center">(&#x0002B;)</td>
<td valign="top" align="center">(&#x0002B;)</td>
</tr>
<tr>
<td/>
<td/>
<td/>
<td valign="top" align="center" style="color:#ee1c23">DRB1&#x0002A;04:05:01:03</td>
<td/>
<td/>
<td/>
<td/>
<td/>
<td/>
<td/>
<td/>
<td/>
<td/>
<td valign="top" align="center">(&#x0002B;)</td>
<td valign="top" align="center">(&#x0002B;)</td>
</tr>
<tr>
<td valign="top" align="left">DRB1&#x0002A;04:01</td>
<td valign="top" align="center">4.3 &#x000D7;<break/> 10e-5</td>
<td valign="top" align="center">2.8<break/> (1.63&#x02013;4.70)</td>
<td valign="top" align="center" style="color:#ee1c23">DRB1&#x0002A;04:01:01:03</td>
<td valign="top" align="center">L</td>
<td valign="top" align="center">L</td>
<td valign="top" align="center">E</td>
<td valign="top" align="center">Q</td>
<td valign="top" align="center">K</td>
<td valign="top" align="center">R</td>
<td valign="top" align="center">A</td>
<td valign="top" align="center"><bold>A</bold></td>
<td valign="top" align="center"><bold>G</bold></td>
<td valign="top" align="center"><bold>A</bold></td>
<td valign="top" align="center">(&#x0002B;)</td>
<td valign="top" align="center">(&#x0002B;)</td>
</tr>
<tr>
<td valign="top" align="left">DRB1&#x0002A;04:10</td>
<td valign="top" align="center">0.01</td>
<td valign="top" align="center">1.8<break/> (1.12&#x02013;3.02)</td>
<td valign="top" align="center" style="color:#ee1c23">DRB1&#x0002A;04:10:03</td>
<td valign="top" align="center">L</td>
<td valign="top" align="center">L</td>
<td valign="top" align="center">E</td>
<td valign="top" align="center">Q</td>
<td valign="top" align="center">R</td>
<td valign="top" align="center">R</td>
<td valign="top" align="center">A</td>
<td valign="top" align="center"><bold>A</bold></td>
<td valign="top" align="center"><bold>G</bold></td>
<td valign="top" align="center"><bold>A</bold></td>
<td valign="top" align="center">(&#x0002B;)</td>
<td valign="top" align="center">(&#x0002B;)</td>
</tr>
<tr style="border-top: thin solid #000000;">
<td valign="top" align="center">DRB1&#x0002A;04:06</td>
<td valign="top" align="center">0.0005</td>
<td valign="top" align="center">0.5<break/> (0.35&#x02013;0.74)</td>
<td valign="top" align="center" style="color:#2e3092">DRB1&#x0002A;04:06:01</td>
<td valign="top" align="center">L</td>
<td valign="top" align="center">L</td>
<td valign="top" align="center">E</td>
<td valign="top" align="center">Q</td>
<td valign="top" align="center">R</td>
<td valign="top" align="center">R</td>
<td valign="top" align="center">A</td>
<td valign="top" align="center"><bold>E</bold></td>
<td valign="top" align="center"><bold>A</bold></td>
<td valign="top" align="center"><bold>G</bold></td>
<td valign="top" align="center">(&#x0002B;)</td>
<td valign="top" align="center">(&#x0002B;)</td>
</tr>
<tr>
<td valign="top" align="left">DRB1&#x0002A;04:03</td>
<td valign="top" align="center">0.0012</td>
<td valign="top" align="center">0.5<break/> (0.30&#x02013;0.74)</td>
<td valign="top" align="center" style="color:#2e3092">DRB1&#x0002A;04:03:01:02</td>
<td valign="top" align="center">L</td>
<td valign="top" align="center">L</td>
<td valign="top" align="center">E</td>
<td valign="top" align="center">Q</td>
<td valign="top" align="center">R</td>
<td valign="top" align="center">R</td>
<td valign="top" align="center">A</td>
<td valign="top" align="center"><bold>E</bold></td>
<td valign="top" align="center"><bold>A</bold></td>
<td valign="top" align="center"><bold>G</bold></td>
<td valign="top" align="center">(&#x0002B;)</td>
<td valign="top" align="center">(&#x0002B;)</td>
</tr>
<tr>
<td valign="top" align="left">DRB1&#x0002A;04:07</td>
<td valign="top" align="center">0.0001</td>
<td valign="top" align="center">0.1<break/> (0.05&#x02013;0.43)</td>
<td valign="top" align="center" style="color:#2e3092">DRB1<sup>&#x0002A;</sup>04:07:01:02</td>
<td valign="top" align="center">L</td>
<td valign="top" align="center">L</td>
<td valign="top" align="center">E</td>
<td valign="top" align="center">Q</td>
<td valign="top" align="center">R</td>
<td valign="top" align="center">R</td>
<td valign="top" align="center">A</td>
<td valign="top" align="center"><bold>E</bold></td>
<td valign="top" align="center"><bold>A</bold></td>
<td valign="top" align="center"><bold>G</bold></td>
<td valign="top" align="center">(&#x0002B;)</td>
<td valign="top" align="center">(&#x0002B;)</td>
</tr>
<tr style="border-top: thin solid #000000;">
<td valign="top" align="center">Other alleles</td>
<td/>
<td/>
<td/>
<td valign="top" align="center">LIF</td>
<td valign="top" align="center">L</td>
<td valign="top" align="center">E</td>
<td valign="top" align="center">QRD</td>
<td valign="top" align="center">RKEA</td>
<td valign="top" align="center">R</td>
<td valign="top" align="center">AG</td>
<td valign="top" align="center">AEQLR</td>
<td valign="top" align="center"><bold>G</bold></td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p><italic>RA-susceptible (red) and resistant (blue) alleles are shown in this table. Amino acid and nucleotide positions are bases on the sequence alignment tool of the IPD-IMGT/HLA database (<ext-link ext-link-type="uri" xlink:href="https://www.ebi.ac.uk/ipd/imgt/hla/align.html">https://www.ebi.ac.uk/ipd/imgt/hla/align.html</ext-link>) using the DRB1<sup>&#x0002A;</sup>04 group sequences shown in Figure <xref ref-type="supplementary-material" rid="SM11">S4</xref> in <xref ref-type="supplementary-material" rid="SM8">Supplementary Material</xref>. The Bold letter indicates a difference of the amino acid or nucleotide sequence between the RA susceptible and resistant alleles. Amino acid positions in the exon 2 were referred from (<xref ref-type="bibr" rid="B47">47</xref>&#x02013;<xref ref-type="bibr" rid="B51">51</xref>)</italic>.</p>
</table-wrap-foot>
</table-wrap>
</sec>
</sec>
<sec sec-type="discussion" id="s4">
<title>Discussion</title>
<p>In this study, a total of 253 full-length HLA allele sequences were determined from 46 healthy subjects with a cumulative frequency of more than 99.2% (ranging from HLA-DQA1: 99.2% to HLA-DQB1: 100%) in the Japanese population (Table <xref ref-type="supplementary-material" rid="SM1">S1</xref>). Of this collection of reference sequences, 50.8% were characterized to be novel and extended alleles (Table <xref ref-type="table" rid="T1">1</xref>), and of these, 67.2% (309 alleles/460 alleles) of class II alleles were novel or extended. Only three of the novel HLA alleles were non-synonymous substitutions and they were within exon 1 of B<sup>&#x0002A;</sup>15:428, exon 3 of DPA1<sup>&#x0002A;</sup>02:07:01:01, and exon 4 of DPA1<sup>&#x0002A;</sup>02:08 (Table <xref ref-type="table" rid="T2">2</xref>). While we focused in this study on producing a full-length HLA reference set for the Japanese population, others have used the PacBio sequencing technologies to determine the full-length HLA allele sequences at six classical loci for 126 International HLA and Immunogenetics Workshop cell lines (<xref ref-type="bibr" rid="B52">52</xref>) and the full-length characterisation of 1056 HLA alleles (<xref ref-type="bibr" rid="B53">53</xref>). Together, these two-separate long-range PacBio sequencing studies have provided a new set of fully characterized full-length HLA allele reference sequences for future large-scale analyses that can be expected to yield additional novel alleles and lead to more accurate HLA genotyping using cheaper and better conventional methods and strategies.</p>
<p>We used both the PacBio and the Ion PGM sequencing technologies to determine the full-length HLA allele genomic sequences that now represent our collection of Japanese reference alleles for coding and non-coding sequences assigned up to the field-4 level to improve future use in routine genotyping. HLA alleles can only be resolved to the field-4 level if the entire gene is sequenced, whereas exonic sequencing is limited to only the field-2 or field-3 level and not beyond. However, unique alleles that have no variants and have been fully sequenced (exons and non-coding regions) also may be identified only to the field-2 level of resolution (such as B<sup>&#x0002A;</sup>15:428 identified in this study) because the field-3 and field-4 identifiers are omitted from the 4-field identification code of allelic resolution. Therefore, the use of the official HLA nomenclature to only the field-2 level of allelic resolution can be confusing because it might imply that either the allele is unique with no sequence variants or that the allele has been sequenced only to the exonic level and that it has not included any of the non-coding sequences. Although it is normally understood that a unique and fully sequenced HLA allele with no sequence variation will be identified only to the 2-level of resolution without the need to add on the field-3 or field-4 identifiers (e.g., B<sup>&#x0002A;</sup>15:428), it might be better to also add them even to the unique alleles in order to avoid confusion, (e.g., B<sup>&#x0002A;</sup>15:428:0:0). The usual omission of the field- 3 and field-4 identifiers from some alleles may need to be changed in the future to distinguish between the fully sequenced unique alleles and the partially exonic-sequenced genes with no non-coding sequence data (e.g., B<sup>&#x0002A;</sup>15:428:-: -). If there are one or more allelic variants with differences in the non-coding sequences then by definition these allelic variants will be identified to the field-4 level of resolution by also including the field-1, field-2, and field-3 identifiers (e.g., B<sup>&#x0002A;</sup>15:428:0:1).</p>
<p>In comparing, the PacBio and the Ion PGM sequencing technologies, we found both methods had their particular limitations with allele misreads and &#x0201C;drop-outs&#x0201D; and problems with homopolymers, four &#x0201C;drop-out&#x0201D; alleles and one mismatched allele were detected in the PacBio data after a comprehensive nucleotide similarity search (Table <xref ref-type="supplementary-material" rid="SM5">S5</xref>). These &#x0201C;artifactual&#x0201D; alleles were likely the result of using low-quality nucleotide subreads during the construction of the consensus sequences. The concordance rate between the PacBio consensus sequences and the finally determined nucleotide sequences (concordance rate &#x0003D; sum of correct allele length (bp) from the PacBio consensus sequences /sum of all allele length (bp) from the finally determined nucleotide sequences &#x000D7; 100) was 99.985% for the eight HLA loci with the mismatched alleles. The concordance rates for the class I loci composed of comparatively short PCR amplicons and the class II loci consisting of relatively longer PCR amplicons were 99.999 and 99.987%, respectively. The largest nucleotide differences were observed for HLA-DPA1 (99.976% similarity) and HLA-DRB1 (99.976% similarity) possibly due to the low amount of DNA used for the PacBio library construction of HLA-DPA1 and the resultant output of subreads of specific HLA-DRB1 alleles that had allelic imbalances generated by the long-range PCR. On the other hand, the concordance rate was 100% in the HLA-C locus for which the mean and minimum subreads per sample were 554 and 424, respectively (Table <xref ref-type="supplementary-material" rid="SM3">S3</xref>). In previous studies of HLA genotyping by second-generation NGS, we found that the determination of the full-length HLA allele sequences was difficult in the HLA-DQA1, HLA-DPA1, and HLA-DPB1 loci because the SNPs and indel densities that were used to separate the chromosomal phases were much lower than in the other HLA loci (<xref ref-type="bibr" rid="B24">24</xref>). However, construction of the consensus sequences for the three HLA class II loci using PacBio sequencing was extremely helpful for improving the characterization and classification of HLA allele sequences from the short-reads generated by Ion Torrent and Sanger sequencing. In this regard, PacBio sequencing is a helpful tool for providing reliable and accurate HLA allele sequences if enough high-quality subreads (minimum subread number of more than 300 and average subread number of more than 500) can be provided for the construction of the consensus sequences.</p>
<p>We also encountered problems with some microsatellite and mono-stretch sequences using both technologies, especially for HLA-DRB1 with the complexity of microsatellite polymorphisms in intron 2. Because sequencing errors due to the presence of microsatellite polymorphisms and mono-stretch sequences, either <italic>in vivo</italic> or generated <italic>in vitro</italic> by PCR, will be observed frequently in future, the problematic sequencing sites should be included in the HLA allele definitions such as DRB1<sup>&#x0002A;</sup>15:01:01:01/02/03.</p>
<p>Overall, we obtained highly accurate HLA allele long-read sequences in most of the PCR regions using PacBio SMRT sequencing without a need to confirm the alleles by also using second-generation sequencing. We could have checked some ambiguous nucleotides and newly discovered variations by using Sanger sequencing instead of the second-generation sequencing method. However, the running cost for PacBio SMRT sequencing is collectively higher than for second-generation sequencing.</p>
<p>Although peptide presentation preferences are the key factor influencing disease susceptibility [(<xref ref-type="bibr" rid="B47">47</xref>) and Table <xref ref-type="table" rid="T4">4</xref>], other factors such as miRNA sequence variants within the coding and noncoding regions are emerging as potential and previously unknown influencing factors (<xref ref-type="bibr" rid="B54">54</xref>). The previous limitation to characterize full-length HLA alleles can be overcome more easily by using third-generation sequencing methods in addition to traditional typing methods to produce more accurate HLA typing results. An advantage of our full-length HLA gene-sequencing protocol is that it generated 5&#x02032; and 3&#x02032; non-coding and intronic non-coding sequences that often are ignored, as well as providing the coding sequences that usually are used to characterize and classify HLA polymorphisms and investigate their associations with disease and transplantation. The polymorphisms and diversity of HLA non-coding sequences is additional beneficial information because non-coding sequences have regulatory roles in gene expression (<xref ref-type="bibr" rid="B55">55</xref>, <xref ref-type="bibr" rid="B56">56</xref>) such as producing or interacting with regulatory microRNA (<xref ref-type="bibr" rid="B19">19</xref>, <xref ref-type="bibr" rid="B54">54</xref>) and regulatory retrotransposons (<xref ref-type="bibr" rid="B57">57</xref>, <xref ref-type="bibr" rid="B58">58</xref>). The HLA non-coding SNPs have been associated with disease and regulation of infection such as the SNP in the 3&#x02032;UTR of HLA-C associated to plasma HIV copy number (<xref ref-type="bibr" rid="B19">19</xref>) and the SNP in the 3&#x02032;UTR of HLA-DPB1 associated to acute GVHD (<xref ref-type="bibr" rid="B20">20</xref>). In this study, by comparing all the aligned DRB1<sup>&#x0002A;</sup>04 allele sequences, we identified new variations that may be related to RA susceptibility and resistance throughout the whole gene regions including a previously &#x0201C;undetermined region.&#x0201D; Within the group of DRB1<sup>&#x0002A;</sup>04 alleles certain shared epitopes at AA 70&#x02013;74 have been associated with RA susceptibility (QRRAA, QKRAA) or resistance (QRRAE). In addition to these known associations, we identified two SNVs (SNV 9,139 and SNV 9,304) in intron 2 correlating with RA susceptibility. Although these non-coding SNVs are still under further investigation and their associations with RA need to be validated in comparative studies using RA patients and healthy subjects, it is evident that HLA-related disease analysis using the full-length HLA-gene sequences provides a new opportunity for the discovery of novel disease-related variations in the highly polymorphic HLA genes.</p>
<p>We undertook a comparative nucleotide analysis of the coding and the non-coding regions of all the HLA allele sequences and mapped their SNV and indel differences (Figure <xref ref-type="supplementary-material" rid="SM9">S2</xref>). We focused on the nucleotide diversity of the HLA-DPB1 sequences and found that there are no nucleotide differences among the alleles in the promoter-enhancer region (data not shown), but that 2.8 SNV/Kb on average were identified across the entire gene allelic sequences and that 4 SNV/Kb were identified in the non-coding regions between intron 2 and the 3&#x02032;UTR region (Segment 2 of Figure <xref ref-type="fig" rid="F3">3A1</xref>). Phylogenetic analysis of all the HLA-DPB1 allelic sequences separated them into DP2 and DP5, two distinct groups that were previously described by phylogeny of peptide binding sequences and other evolutionary markers (<xref ref-type="bibr" rid="B46">46</xref>). Although the allele-specific polymorphisms observed in exon 2 appear to have been generated independently of the DP2 and DP5 subgroups, the SNV rs9277534 within the 3&#x02032;UTR that was associated with the regulation of HLA-DPB1 gene expression (<xref ref-type="bibr" rid="B20">20</xref>) also was associated strongly with one or other of the two DP groups. The high expression rs9277534G grouped within DP5, whereas the low expression rs9277534A grouped within DP2. The role of this rs9277534 SNV in gene expression is important because it may provoke acute GVHD after unrelated hematopoietic cell transplantation (UR-HCT) in a different manner from the T-cell epitope (TCE) mismatching algorithm (<xref ref-type="bibr" rid="B59">59</xref>), reflecting exon 2 polymorphisms and structural differences of HLA-DP molecules between patient and donor and affect acute GVHD in HLA-DPB1 mismatched UR-HCT (<xref ref-type="bibr" rid="B60">60</xref>). Although phylogenetic trees of the 12,149 bp for whole gene region, the 2,668 bp from exon 3 to 3&#x02032;UTR and the 264 bp for exon 2 were published previously (<xref ref-type="bibr" rid="B60">60</xref>), our present study has advanced the previous findings because we identified a genomic boundary between the DP2 and DP5 groups from the 19 HLA-DPB1 allele sequences.</p>
<p>In the present study, we used the computing program RepeatMasker to search for and identify novel retrotransposons in our full-length HLA-DRB1 sequences that could be useful polymorphic indel markers for investigating the evolution of ancestral haplotypes or be associated with diseases. We found DR-type specific indels of SINE, LINE, Medium reiterated repeat (MER) and Long terminal repeat (LTR) sequences that were mainly located within the introns 1, 2, and 5 of the HLA-DRB1 sequences. These findings on HLA retroelement indel polymorphisms complement and expand on the previous results of others (<xref ref-type="bibr" rid="B43">43</xref>, <xref ref-type="bibr" rid="B44">44</xref>, <xref ref-type="bibr" rid="B61">61</xref>).</p>
</sec>
<sec sec-type="conclusions" id="s5">
<title>Conclusion</title>
<p>We determined, characterized and reclassified 253 full-length HLA allele sequences using both the third-generation SMRT and the second-generation Ion Torrent NGS technologies. These newly generated and classified reference sequences will help to genotype HLA genes to the full-length level and to accurately identify rare, novel and null alleles, which in turn should help to provide new information and knowledge for future population genetics, HLA-related disease, and transplantation studies. Finally, a much greater collection of high-quality, fully characterized full-length HLA allele sequences should be determined worldwide in many different populations.</p>
</sec>
<sec id="s6">
<title>Data availability</title>
<p>The HLA allele sequences are available in GenBank/DDBJ/ENBL-EBI DNA databases and IPD-IMGT/HLA database. The detail information such as the accession numbers and official HLA allele names are indicated in the Table <xref ref-type="supplementary-material" rid="SM7">S7</xref>.</p>
</sec>
<sec id="s7">
<title>Ethics statement</title>
<p>The study protocol was approved from the institutional review board of the Japan Marrow Donor Program (JMDP) and Tokai University (Application number: 15I-04) and informed consents were obtained from donors in accordance with the Declaration of Helsinki.</p>
</sec>
<sec id="s8">
<title>Author contributions</title>
<p>SS, TS, and SR designed, set up some of the approaches, and carried out most of the experiments. JH analyzed the data. SI, AS, AM, JH, PB, and MK were involved in nucleotide sequencing. YO, AO, JS, SM, YM, and HI designed and supported the study. SS, TS, KO, and JK performed analysis and wrote the paper. All authors checked the final version of the paper.</p>
<sec>
<title>Conflict of interest statement</title>
<p>SR, JH and PB are employees of Pacific Biosciences, KO, MK and JS are employees of Tomy Digital Biology, and AM and HI are employees of GenoDive Pharma. The remaining authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
</sec>
</body>
<back>
<ack><p>We thank the Japan Marrow Donor Program office.</p>
</ack><sec sec-type="supplementary-material" id="s9">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fimmu.2018.02294/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fimmu.2018.02294/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Table_1.XLSX" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table_2.XLSX" id="SM2" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table_3.XLSX" id="SM3" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table_4.XLSX" id="SM4" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table_5.XLSX" id="SM5" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table_6.XLSX" id="SM6" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table_7.XLSX" id="SM7" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Presentation_1.PPTX" id="SM8" mimetype="application/vnd.openxmlformats-officedocument.presentationml.presentation" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Presentation_2.PPTX" id="SM9" mimetype="application/vnd.openxmlformats-officedocument.presentationml.presentation" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Presentation_3.PPTX" id="SM10" mimetype="application/vnd.openxmlformats-officedocument.presentationml.presentation" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Presentation_4.pdf" id="SM11" mimetype="application/pdf" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<label>1.</label>
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Kulski</surname> <given-names>JK</given-names></name> <name><surname>Inoko</surname> <given-names>H</given-names></name></person-group>. <article-title>Major Histocompatibility Complex (MHC) genes</article-title>. In <person-group person-group-type="editor"><name><surname>Cooper</surname> <given-names>DN</given-names></name></person-group>, editor. <source>National Encyclopedia of the Human Genome</source>. Vol. <volume>3</volume>. <publisher-loc>London</publisher-loc>: <publisher-name>John Wiley &#x00026; Sons, Inc.</publisher-name> (<year>2003</year>). p. <fpage>778</fpage>&#x02013;<lpage>85</lpage>.</citation></ref>
<ref id="B2">
<label>2.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Thorsby</surname> <given-names>E</given-names></name></person-group>. <article-title>A short history of HLA</article-title>. <source>Tissue Antigens</source> (<year>2009</year>) <volume>74</volume>:<fpage>101</fpage>&#x02013;<lpage>16</lpage>. <pub-id pub-id-type="doi">10.1111/j.1399-0039.2009.01291.x</pub-id><pub-id pub-id-type="pmid">19523022</pub-id></citation></ref>
<ref id="B3">
<label>3.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zinkernagel</surname> <given-names>RM</given-names></name> <name><surname>Doherty</surname> <given-names>PC</given-names></name></person-group>. <article-title>The discovery of MHC restriction</article-title>. <source>Immunol Today</source> (<year>1997</year>) <volume>18</volume>:<fpage>14</fpage>&#x02013;<lpage>7</lpage>. <pub-id pub-id-type="pmid">9018968</pub-id></citation></ref>
<ref id="B4">
<label>4.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sasazuki</surname> <given-names>T</given-names></name> <name><surname>Juji</surname> <given-names>T</given-names></name> <name><surname>Morishima</surname> <given-names>Y</given-names></name> <name><surname>Kinukawa</surname> <given-names>N</given-names></name> <name><surname>Kashiwabara</surname> <given-names>H</given-names></name> <name><surname>Inoko</surname> <given-names>H</given-names></name> <etal/></person-group>. <article-title>Effect of matching of class I HLA alleles on clinical outcome after transplantation of hematopoietic stem cells from an unrelated donor. Japan Marrow Donor Program</article-title>. <source>N Eng J Med.</source> (<year>1998</year>) <volume>339</volume>:<fpage>1177</fpage>&#x02013;<lpage>85</lpage>. <pub-id pub-id-type="pmid">9780337</pub-id></citation></ref>
<ref id="B5">
<label>5.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mungall</surname> <given-names>AJ</given-names></name> <name><surname>Palmer</surname> <given-names>SA</given-names></name> <name><surname>Sims</surname> <given-names>SK</given-names></name> <name><surname>Edwards</surname> <given-names>CA</given-names></name> <name><surname>Ashurst</surname> <given-names>JL</given-names></name> <name><surname>Wilming</surname> <given-names>L</given-names></name> <etal/></person-group>. <article-title>The DNA sequence and analysis of human chromosome 6</article-title>. <source>Nature</source> (<year>2003</year>) <volume>425</volume>:<fpage>805</fpage>&#x02013;<lpage>11</lpage>. <pub-id pub-id-type="doi">10.1038/nature02055</pub-id><pub-id pub-id-type="pmid">14574404</pub-id></citation></ref>
<ref id="B6">
<label>6.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shiina</surname> <given-names>T</given-names></name> <name><surname>Inoko</surname> <given-names>H</given-names></name> <name><surname>Kulski</surname> <given-names>JK</given-names></name></person-group>. <article-title>An update of the HLA genomic region, locus information and disease associations: 2004</article-title>. <source>Tissue Antigens</source> (<year>2004</year>) <volume>64</volume>:<fpage>631</fpage>&#x02013;<lpage>49</lpage>. <pub-id pub-id-type="doi">10.1111/j.1399-0039.2004.00327.x</pub-id><pub-id pub-id-type="pmid">15546336</pub-id></citation></ref>
<ref id="B7">
<label>7.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shiina</surname> <given-names>T</given-names></name> <name><surname>Hosomichi</surname> <given-names>K</given-names></name> <name><surname>Inoko</surname> <given-names>H</given-names></name> <name><surname>Kulski</surname> <given-names>JK</given-names></name></person-group>. <article-title>The HLA genomic loci map: expression, interaction, diversity and disease</article-title>. <source>J Hum Genet.</source> (<year>2009</year>) <volume>54</volume>:<fpage>15</fpage>&#x02013;<lpage>39</lpage>. <pub-id pub-id-type="doi">10.1038/jhg.2008.5</pub-id><pub-id pub-id-type="pmid">19158813</pub-id></citation></ref>
<ref id="B8">
<label>8.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Trowsdale</surname> <given-names>J</given-names></name> <name><surname>Knight</surname> <given-names>JC</given-names></name></person-group>. <article-title>Major histocompatibility complex genomics and human disease</article-title>. <source>Ann Rev Genomics Hum Genet.</source> (<year>2013</year>) <volume>14</volume>:<fpage>301</fpage>&#x02013;<lpage>23</lpage>. <pub-id pub-id-type="doi">10.1146/annurev-genom-091212-153455</pub-id><pub-id pub-id-type="pmid">23875801</pub-id></citation></ref>
<ref id="B9">
<label>9.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ota</surname> <given-names>M</given-names></name> <name><surname>Seki</surname> <given-names>T</given-names></name> <name><surname>Fukushima</surname> <given-names>H</given-names></name> <name><surname>Tsuji</surname> <given-names>K</given-names></name> <name><surname>Inoko</surname> <given-names>H</given-names></name></person-group>. <article-title>HLA-DRB1 genotyping by modified PCR-RFLP method combined with group-specific primers</article-title>. <source>Tissue Antigens</source> (<year>1992</year>) <volume>39</volume>:<fpage>187</fpage>&#x02013;<lpage>202</lpage>. <pub-id pub-id-type="pmid">1356282</pub-id></citation></ref>
<ref id="B10">
<label>10.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Arguello</surname> <given-names>JR</given-names></name> <name><surname>Madrigal</surname> <given-names>JA</given-names></name></person-group>. <article-title>HLA typing by Reference Strand Mediated Conformation Analysis (RSCA)</article-title>. <source>Rev Immunogenet.</source> (<year>1999</year>) <volume>1</volume>:<fpage>209</fpage>&#x02013;<lpage>19</lpage>. <pub-id pub-id-type="pmid">11253947</pub-id></citation></ref>
<ref id="B11">
<label>11.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Saiki</surname> <given-names>RK</given-names></name> <name><surname>Walsh</surname> <given-names>PS</given-names></name> <name><surname>Levenson</surname> <given-names>CH</given-names></name> <name><surname>Erlich</surname> <given-names>HA</given-names></name></person-group>. <article-title>Genetic analysis of amplified DNA with immobilized sequence-specific oligonucleotide probes</article-title>. <source>Proc Natl Acad Sci USA.</source> (<year>1989</year>) <volume>86</volume>:<fpage>6230</fpage>&#x02013;<lpage>4</lpage>. <pub-id pub-id-type="pmid">2762325</pub-id></citation></ref>
<ref id="B12">
<label>12.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Olerup</surname> <given-names>O</given-names></name> <name><surname>Zetterquist</surname> <given-names>H</given-names></name></person-group>. <article-title>HLA-DR typing by PCR amplification with sequence-specific primers (PCR-SSP) in 2 hours: an alternative to serological DR typing in clinical practice including donor-recipient matching in cadaveric transplantation</article-title>. <source>Tissue Antigens</source> (<year>1992</year>) <volume>39</volume>:<fpage>225</fpage>&#x02013;<lpage>35</lpage>. <pub-id pub-id-type="pmid">1357775</pub-id></citation></ref>
<ref id="B13">
<label>13.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Santamaria</surname> <given-names>P</given-names></name> <name><surname>Lindstrom</surname> <given-names>AL</given-names></name> <name><surname>Boyce-Jacino</surname> <given-names>MT</given-names></name> <name><surname>Myster</surname> <given-names>SH</given-names></name> <name><surname>Barbosa</surname> <given-names>JJ</given-names></name> <name><surname>Faras</surname> <given-names>AJ</given-names></name> <etal/></person-group>. <article-title>HLA class I sequence-based typing</article-title>. <source>Hum Immunol.</source> (<year>1993</year>) <volume>37</volume>:<fpage>39</fpage>&#x02013;<lpage>50</lpage>. <pub-id pub-id-type="pmid">8376187</pub-id></citation></ref>
<ref id="B14">
<label>14.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sheldon</surname> <given-names>S</given-names></name> <name><surname>Poulton</surname> <given-names>K</given-names></name></person-group>. <article-title>HLA typing and its influence on organ transplantation</article-title>. <source>Methods Mol Biol.</source> (<year>2006</year>) <volume>333</volume>:<fpage>157</fpage>&#x02013;<lpage>74</lpage>. <pub-id pub-id-type="doi">10.1385/1-59745-049-9:157</pub-id><pub-id pub-id-type="pmid">16790851</pub-id></citation></ref>
<ref id="B15">
<label>15.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mahdi</surname> <given-names>BM</given-names></name></person-group>. <article-title>A glow of HLA typing in organ transplantation</article-title>. <source>Clin Transl Med.</source> (<year>2013</year>) <volume>2</volume>:<fpage>6</fpage>. <pub-id pub-id-type="doi">10.1186/2001-1326-2-6</pub-id><pub-id pub-id-type="pmid">23432791</pub-id></citation></ref>
<ref id="B16">
<label>16.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Erlich</surname> <given-names>HA</given-names></name> <name><surname>Opelz</surname> <given-names>G</given-names></name> <name><surname>Hansen</surname> <given-names>J</given-names></name></person-group>. <article-title>HLA DNA typing and transplantation</article-title>. <source>Immunity</source> (<year>2001</year>) <volume>14</volume>:<fpage>347</fpage>&#x02013;<lpage>56</lpage>. <pub-id pub-id-type="doi">10.1016/S1074-7613(01)00115-7</pub-id><pub-id pub-id-type="pmid">11336680</pub-id></citation></ref>
<ref id="B17">
<label>17.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Adams</surname> <given-names>SD</given-names></name> <name><surname>Barracchini</surname> <given-names>KC</given-names></name> <name><surname>Chen</surname> <given-names>D</given-names></name> <name><surname>Robbins</surname> <given-names>F</given-names></name> <name><surname>Wang</surname> <given-names>L</given-names></name> <name><surname>Larsen</surname> <given-names>P</given-names></name> <etal/></person-group>. <article-title>Ambiguous allele combinations in HLA Class I and Class II sequence-based typing: when precise nucleotide sequencing leads to imprecise allele identification</article-title>. <source>J Transl Med.</source> (<year>2004</year>) <volume>2</volume>:<fpage>30</fpage>. <pub-id pub-id-type="doi">10.1186/1479-5876-2-30</pub-id><pub-id pub-id-type="pmid">15363110</pub-id></citation></ref>
<ref id="B18">
<label>18.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lind</surname> <given-names>C</given-names></name> <name><surname>Ferriola</surname> <given-names>D</given-names></name> <name><surname>Mackiewicz</surname> <given-names>K</given-names></name> <name><surname>Heron</surname> <given-names>S</given-names></name> <name><surname>Rogers</surname> <given-names>M</given-names></name> <name><surname>Slavich</surname> <given-names>L</given-names></name> <etal/></person-group>. <article-title>Next-generation sequencing: the solution for high-resolution, unambiguous human leukocyte antigen typing</article-title>. <source>Hum Immunol.</source> (<year>2010</year>) <volume>71</volume>:<fpage>1033</fpage>&#x02013;<lpage>42</lpage>. <pub-id pub-id-type="doi">10.1016/j.humimm.2010.06.016</pub-id><pub-id pub-id-type="pmid">20603174</pub-id></citation></ref>
<ref id="B19">
<label>19.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kulkarni</surname> <given-names>S</given-names></name> <name><surname>Savan</surname> <given-names>R</given-names></name> <name><surname>Qi</surname> <given-names>Y</given-names></name> <name><surname>Gao</surname> <given-names>X</given-names></name> <name><surname>Yuki</surname> <given-names>Y</given-names></name> <name><surname>Bass</surname> <given-names>SE</given-names></name> <etal/></person-group>. <article-title>Differential microRNA regulation of HLA-C expression and its association with HIV control</article-title>. <source>Nature</source> (<year>2011</year>) <volume>472</volume>:<fpage>495</fpage>&#x02013;<lpage>8</lpage>. <pub-id pub-id-type="doi">10.1038/nature09914</pub-id><pub-id pub-id-type="pmid">21499264</pub-id></citation></ref>
<ref id="B20">
<label>20.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Petersdorf</surname> <given-names>EW</given-names></name> <name><surname>Malkki</surname> <given-names>M</given-names></name> <name><surname>O&#x00027;HUigin</surname> <given-names>C</given-names></name> <name><surname>Carrington</surname> <given-names>M</given-names></name> <name><surname>Gooley</surname> <given-names>T</given-names></name> <name><surname>Haagenson</surname> <given-names>MD</given-names></name> <etal/></person-group>. <article-title>High HLA-DP expression and graft-versus-host disease</article-title>. <source>N Eng J Med.</source> (<year>2015</year>) <volume>373</volume>:<fpage>599</fpage>&#x02013;<lpage>609</lpage>. <pub-id pub-id-type="doi">10.1056/NEJMoa1500140</pub-id><pub-id pub-id-type="pmid">26267621</pub-id></citation></ref>
<ref id="B21">
<label>21.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ramsuran</surname> <given-names>V</given-names></name> <name><surname>Kulkarni</surname> <given-names>S</given-names></name> <name><surname>O&#x00027;Huigin</surname> <given-names>C</given-names></name> <name><surname>Yuki</surname> <given-names>Y</given-names></name> <name><surname>Augusto</surname> <given-names>DG</given-names></name> <name><surname>Gao</surname> <given-names>X</given-names></name> <etal/></person-group>. <article-title>Epigenetic regulation of differential HLA-A allelic expression levels</article-title>. <source>Hum Mol Genet.</source> (<year>2015</year>) <volume>24</volume>:<fpage>4268</fpage>&#x02013;<lpage>75</lpage>. <pub-id pub-id-type="doi">10.1093/hmg/ddv158</pub-id><pub-id pub-id-type="pmid">25935001</pub-id></citation></ref>
<ref id="B22">
<label>22.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Robinson</surname> <given-names>J</given-names></name> <name><surname>Soormally</surname> <given-names>AR</given-names></name> <name><surname>Hayhurst</surname> <given-names>JD</given-names></name> <name><surname>Marsh</surname> <given-names>SG</given-names></name></person-group>. <article-title>The IPD-IMGT/HLA database - new developments in reporting HLA variation</article-title>. <source>Hum Immunol.</source> (<year>2016</year>) <volume>77</volume>:<fpage>233</fpage>&#x02013;<lpage>7</lpage>. <pub-id pub-id-type="doi">10.1016/j.humimm.2016.01.020</pub-id><pub-id pub-id-type="pmid">26826444</pub-id></citation></ref>
<ref id="B23">
<label>23.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hosomichi</surname> <given-names>K</given-names></name> <name><surname>Shiina</surname> <given-names>T</given-names></name> <name><surname>Tajima</surname> <given-names>A</given-names></name> <name><surname>Inoue</surname> <given-names>I</given-names></name></person-group>. <article-title>The impact of next-generation sequencing technologies on HLA research</article-title>. <source>J Hum Genet.</source> (<year>2015</year>) <volume>60</volume>:<fpage>665</fpage>&#x02013;<lpage>73</lpage>. <pub-id pub-id-type="doi">10.1038/jhg.2015.102</pub-id><pub-id pub-id-type="pmid">26311539</pub-id></citation></ref>
<ref id="B24">
<label>24.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shiina</surname> <given-names>T</given-names></name> <name><surname>Suzuki</surname> <given-names>S</given-names></name> <name><surname>Ozaki</surname> <given-names>Y</given-names></name> <name><surname>Taira</surname> <given-names>H</given-names></name> <name><surname>Kikkawa</surname> <given-names>E</given-names></name> <name><surname>Shigenari</surname> <given-names>A</given-names></name> <etal/></person-group>. <article-title>Super high resolution for single molecule-sequence-based typing of classical HLA loci at the 8-digit level using next generation sequencers</article-title>. <source>Tissue Antigens</source> (<year>2012</year>) <volume>80</volume>:<fpage>305</fpage>&#x02013;<lpage>16</lpage>. <pub-id pub-id-type="doi">10.1111/j.1399-0039.2012.01941.x</pub-id><pub-id pub-id-type="pmid">22861646</pub-id></citation></ref>
<ref id="B25">
<label>25.</label>
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Kulski</surname> <given-names>JK</given-names></name> <name><surname>Suzuki</surname> <given-names>S</given-names></name> <name><surname>Ozaki</surname> <given-names>Y</given-names></name> <name><surname>Mitsunaga</surname> <given-names>S</given-names></name> <name><surname>Inoko</surname> <given-names>H</given-names></name> <name><surname>Shiina</surname> <given-names>T</given-names></name></person-group>. <article-title>In phase HLA genotyping by next generation sequencing &#x02013; a comparison between two massively parallel sequencing bench-top systems, the ROCHE GS junior and ion torrent PGM</article-title>. In: <person-group person-group-type="editor"><name><surname>Xi</surname> <given-names>Y</given-names></name></person-group>, editor. <source>HLA and Associated Important Diseases</source>. <publisher-loc>Croatia</publisher-loc>: <publisher-name>Intech</publisher-name> (<year>2014</year>). p. <fpage>141</fpage>&#x02013;<lpage>81</lpage>.</citation></ref>
<ref id="B26">
<label>26.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ozaki</surname> <given-names>Y</given-names></name> <name><surname>Suzuki</surname> <given-names>S</given-names></name> <name><surname>Kashiwase</surname> <given-names>K</given-names></name> <name><surname>Shigenari</surname> <given-names>A</given-names></name> <name><surname>Okudaira</surname> <given-names>Y</given-names></name> <name><surname>Ito</surname> <given-names>S</given-names></name> <etal/></person-group>. <article-title>Cost-efficient multiplex PCR for routine genotyping of up to nine classical HLA loci in a single analytical run of multiple samples by next generation sequencing</article-title>. <source>BMC Genomics</source> (<year>2015</year>) <volume>16</volume>:<fpage>318</fpage>. <pub-id pub-id-type="doi">10.1186/s12864-015-1514-4</pub-id><pub-id pub-id-type="pmid">25895492</pub-id></citation></ref>
<ref id="B27">
<label>27.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>C</given-names></name> <name><surname>Krishnakumar</surname> <given-names>S</given-names></name> <name><surname>Wilhelmy</surname> <given-names>J</given-names></name> <name><surname>Babrzadeh</surname> <given-names>F</given-names></name> <name><surname>Stepanyan</surname> <given-names>L</given-names></name> <name><surname>Su</surname> <given-names>LF</given-names></name> <etal/></person-group>. <article-title>High-throughput, high-fidelity HLA genotyping with deep sequencing</article-title>. <source>Proc Natl Acad Sci USA.</source> (<year>2012</year>) <volume>109</volume>:<fpage>8676</fpage>&#x02013;<lpage>81</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1206614109</pub-id><pub-id pub-id-type="pmid">22589303</pub-id></citation></ref>
<ref id="B28">
<label>28.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hosomichi</surname> <given-names>K</given-names></name> <name><surname>Jinam</surname> <given-names>TA</given-names></name> <name><surname>Mitsunaga</surname> <given-names>S</given-names></name> <name><surname>Nakaoka</surname> <given-names>H</given-names></name> <name><surname>Inoue</surname> <given-names>I</given-names></name></person-group>. <article-title>Phase-defined complete sequencing of the HLA genes by next-generation sequencing</article-title>. <source>BMC Genomics</source> (<year>2013</year>) <volume>14</volume>:<fpage>355</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2164-14-355</pub-id><pub-id pub-id-type="pmid">23714642</pub-id></citation></ref>
<ref id="B29">
<label>29.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ehrenberg</surname> <given-names>PK</given-names></name> <name><surname>Geretz</surname> <given-names>A</given-names></name> <name><surname>Baldwin</surname> <given-names>KM</given-names></name> <name><surname>Apps</surname> <given-names>R</given-names></name> <name><surname>Polonis</surname> <given-names>VR</given-names></name> <name><surname>Robb</surname> <given-names>ML</given-names></name> <etal/></person-group>. <article-title>High-throughput multiplex HLA genotyping by next-generation sequencing using multi-locus individual tagging</article-title>. <source>BMC Genomics</source> (<year>2014</year>) <volume>15</volume>:<fpage>864</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2164-15-864</pub-id><pub-id pub-id-type="pmid">25283548</pub-id></citation></ref>
<ref id="B30">
<label>30.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Smith</surname> <given-names>AG</given-names></name> <name><surname>Pyo</surname> <given-names>CW</given-names></name> <name><surname>Nelson</surname> <given-names>W</given-names></name> <name><surname>Gow</surname> <given-names>E</given-names></name> <name><surname>Wang</surname> <given-names>R</given-names></name> <name><surname>Shen</surname> <given-names>S</given-names></name> <etal/></person-group>. <article-title>Next generation sequencing to determine HLA class II genotypes in a cohort of hematopoietic cell transplant patients and donors</article-title>. <source>Human Immunol.</source> (<year>2014</year>) <volume>75</volume>:<fpage>1040</fpage>&#x02013;<lpage>6</lpage>. <pub-id pub-id-type="doi">10.1016/j.humimm.2014.08.206</pub-id><pub-id pub-id-type="pmid">25167774</pub-id></citation></ref>
<ref id="B31">
<label>31.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lange</surname> <given-names>V</given-names></name> <name><surname>Bohme</surname> <given-names>I</given-names></name> <name><surname>Hofmann</surname> <given-names>J</given-names></name> <name><surname>Lang</surname> <given-names>K</given-names></name> <name><surname>Sauter</surname> <given-names>J</given-names></name> <name><surname>Schone</surname> <given-names>B</given-names></name> <etal/></person-group>. <article-title>Cost-efficient high-throughput HLA typing by MiSeq amplicon sequencing</article-title>. <source>BMC Genomics</source> (<year>2014</year>) <volume>15</volume>:<fpage>63</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2164-15-63</pub-id><pub-id pub-id-type="pmid">24460756</pub-id></citation></ref>
<ref id="B32">
<label>32.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Duke</surname> <given-names>JL</given-names></name> <name><surname>Lind</surname> <given-names>C</given-names></name> <name><surname>Mackiewicz</surname> <given-names>K</given-names></name> <name><surname>Ferriola</surname> <given-names>D</given-names></name> <name><surname>Papazoglou</surname> <given-names>A</given-names></name> <name><surname>Gasiewski</surname> <given-names>A</given-names></name> <etal/></person-group>. <article-title>Determining performance characteristics of an NGS-based HLA typing method for clinical applications</article-title>. <source>Hla</source> (<year>2016</year>) <volume>87</volume>:<fpage>141</fpage>&#x02013;<lpage>52</lpage>. <pub-id pub-id-type="doi">10.1111/tan.12736</pub-id><pub-id pub-id-type="pmid">26880737</pub-id></citation></ref>
<ref id="B33">
<label>33.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Eid</surname> <given-names>J</given-names></name> <name><surname>Fehr</surname> <given-names>A</given-names></name> <name><surname>Gray</surname> <given-names>J</given-names></name> <name><surname>Luong</surname> <given-names>K</given-names></name> <name><surname>Lyle</surname> <given-names>J</given-names></name> <name><surname>Otto</surname> <given-names>G</given-names></name> <etal/></person-group>. <article-title>Real-time DNA sequencing from single polymerase molecules</article-title>. <source>Science</source> (<year>2009</year>) <volume>323</volume>:<fpage>133</fpage>&#x02013;<lpage>8</lpage>. <pub-id pub-id-type="doi">10.1126/science.1162986</pub-id><pub-id pub-id-type="pmid">19023044</pub-id></citation></ref>
<ref id="B34">
<label>34.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Travers</surname> <given-names>KJ</given-names></name> <name><surname>Chin</surname> <given-names>CS</given-names></name> <name><surname>Rank</surname> <given-names>DR</given-names></name> <name><surname>Eid</surname> <given-names>JS</given-names></name> <name><surname>Turner</surname> <given-names>SW</given-names></name></person-group>. <article-title>A flexible and efficient template format for circular consensus sequencing and SNP detection</article-title>. <source>Nucleic Acids Res.</source> (<year>2010</year>) <volume>38</volume>:<fpage>e159</fpage>. <pub-id pub-id-type="doi">10.1093/nar/gkq543</pub-id><pub-id pub-id-type="pmid">20571086</pub-id></citation></ref>
<ref id="B35">
<label>35.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Morishima</surname> <given-names>Y</given-names></name> <name><surname>Kashiwase</surname> <given-names>K</given-names></name> <name><surname>Matsuo</surname> <given-names>K</given-names></name> <name><surname>Azuma</surname> <given-names>F</given-names></name> <name><surname>Morishima</surname> <given-names>S</given-names></name> <name><surname>Onizuka</surname> <given-names>M</given-names></name> <etal/></person-group>. <article-title>Biological significance of HLA locus matching in unrelated donor bone marrow transplantation</article-title>. <source>Blood</source> (<year>2015</year>) <volume>125</volume>:<fpage>1189</fpage>&#x02013;<lpage>97</lpage>. <pub-id pub-id-type="doi">10.1182/blood-2014-10-604785</pub-id><pub-id pub-id-type="pmid">25519752</pub-id></citation></ref>
<ref id="B36">
<label>36.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Vogel</surname> <given-names>U</given-names></name> <name><surname>Szczepanowski</surname> <given-names>R</given-names></name> <name><surname>Claus</surname> <given-names>H</given-names></name> <name><surname>Junemann</surname> <given-names>S</given-names></name> <name><surname>Prior</surname> <given-names>K</given-names></name> <name><surname>Harmsen</surname> <given-names>D</given-names></name></person-group>. <article-title>Ion torrent personal genome machine sequencing for genomic typing of <italic>Neisseria meningitidis</italic> for rapid determination of multiple layers of typing information</article-title>. <source>J Clin Microbiol.</source> (<year>2012</year>) <volume>50</volume>:<fpage>1889</fpage>&#x02013;<lpage>94</lpage>. <pub-id pub-id-type="doi">10.1128/JCM.00038-12</pub-id><pub-id pub-id-type="pmid">22461678</pub-id></citation></ref>
<ref id="B37">
<label>37.</label>
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Shiina</surname> <given-names>T</given-names></name> <name><surname>Suzuki</surname> <given-names>S</given-names></name> <name><surname>Kulski</surname> <given-names>JK</given-names></name></person-group>. <article-title>MHC genotyping in human and nonhuman species by PCR-based next-generation sequencing</article-title>. In: <person-group person-group-type="editor"><name><surname>Kulski</surname> <given-names>JK</given-names></name></person-group> editor, <source>Next Generation Sequencing</source>. <publisher-loc>Croatia</publisher-loc>:<publisher-name>Intech</publisher-name> (<year>2016</year>). p. <fpage>81</fpage>&#x02013;<lpage>109</lpage>.</citation></ref>
<ref id="B38">
<label>38.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Holcomb</surname> <given-names>CL</given-names></name> <name><surname>Rastrou</surname> <given-names>M</given-names></name> <name><surname>Williams</surname> <given-names>TC</given-names></name> <name><surname>Goodridge</surname> <given-names>D</given-names></name> <name><surname>Lazaro</surname> <given-names>AM</given-names></name> <name><surname>Tilanus</surname> <given-names>M</given-names></name> <etal/></person-group>. <article-title>Next-generation sequencing can reveal in vitro-generated PCR crossover products: some artifactual sequences correspond to HLA alleles in the IMGT/HLA database</article-title>. <source>Tissue Antigens</source> (<year>2014</year>) <volume>83</volume>:<fpage>32</fpage>&#x02013;<lpage>40</lpage>. <pub-id pub-id-type="doi">10.1111/tan.12269</pub-id><pub-id pub-id-type="pmid">24355006</pub-id></citation></ref>
<ref id="B39">
<label>39.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tamura</surname> <given-names>K</given-names></name> <name><surname>Stecher</surname> <given-names>G</given-names></name> <name><surname>Peterson</surname> <given-names>D</given-names></name> <name><surname>Filipski</surname> <given-names>A</given-names></name> <name><surname>Kumar</surname> <given-names>S</given-names></name></person-group>. <article-title>MEGA6: Molecular evolutionary genetics analysis version 6.0</article-title>. <source>Mol Biol Evol.</source> (<year>2013</year>) <volume>30</volume>:<fpage>2725</fpage>&#x02013;<lpage>9</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/mst197</pub-id><pub-id pub-id-type="pmid">24132122</pub-id></citation></ref>
<ref id="B40">
<label>40.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Saitou</surname> <given-names>N</given-names></name> <name><surname>Nei</surname> <given-names>M</given-names></name></person-group>. <article-title>The neighbor-joining method: a new method for reconstructing phylogenetic trees</article-title>. <source>Mol Biol Evol</source>. (<year>1987</year>) <volume>4</volume>:<fpage>406</fpage>&#x02013;<lpage>25</lpage>. <pub-id pub-id-type="pmid">3447015</pub-id></citation></ref>
<ref id="B41">
<label>41.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Marsh</surname> <given-names>SG</given-names></name> <name><surname>Albert</surname> <given-names>ED</given-names></name> <name><surname>Bodmer</surname> <given-names>WF</given-names></name> <name><surname>Bontrop</surname> <given-names>RE</given-names></name> <name><surname>Dupont</surname> <given-names>B</given-names></name> <name><surname>Erlich</surname> <given-names>HA</given-names></name> <etal/></person-group>. <article-title>Nomenclature for factors of the HLA system, 2010</article-title>. <source>Tissue Antigens</source> (<year>2010</year>) <volume>75</volume>:<fpage>291</fpage>&#x02013;<lpage>455</lpage>. <pub-id pub-id-type="doi">10.1111/j.1399-0039.2010.01466.x</pub-id><pub-id pub-id-type="pmid">20356336</pub-id></citation></ref>
<ref id="B42">
<label>42.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mack</surname> <given-names>SJ</given-names></name></person-group>. <article-title>A gene feature enumeration approach for describing HLA allele polymorphism</article-title>. <source>Hum Immunol.</source> (<year>2015</year>) <volume>76</volume>:<fpage>975</fpage>&#x02013;<lpage>81</lpage>. <pub-id pub-id-type="doi">10.1016/j.humimm.2015.09.016</pub-id><pub-id pub-id-type="pmid">26416087</pub-id></citation></ref>
<ref id="B43">
<label>43.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Andersson</surname> <given-names>G</given-names></name></person-group>. <article-title>Evolution of the human HLA-DR region</article-title>. <source>Front Biosci.</source> (<year>1998</year>) <volume>3</volume>:<fpage>d739</fpage>&#x02013;<lpage>45</lpage>. <pub-id pub-id-type="pmid">9675159</pub-id></citation></ref>
<ref id="B44">
<label>44.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kulski</surname> <given-names>JK</given-names></name> <name><surname>Shigenari</surname> <given-names>A</given-names></name> <name><surname>Shiina</surname> <given-names>T</given-names></name> <name><surname>Inoko</surname> <given-names>H</given-names></name></person-group>. <article-title>Polymorphic major histocompatibility complex class II Alu insertions at five loci and their association with HLA-DRB1 and -DQB1 in Japanese and Caucasians</article-title>. <source>Tissue Antigens</source> (<year>2010</year>) <volume>76</volume>:<fpage>35</fpage>&#x02013;<lpage>47</lpage>. <pub-id pub-id-type="doi">10.1111/j.1399-0039.2010.01465.x</pub-id><pub-id pub-id-type="pmid">20403137</pub-id></citation></ref>
<ref id="B45">
<label>45.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Louis</surname> <given-names>P</given-names></name> <name><surname>Eliaou</surname> <given-names>JF</given-names></name> <name><surname>Kerlan-Candon</surname> <given-names>S</given-names></name> <name><surname>Pinet</surname> <given-names>V</given-names></name> <name><surname>Vincent</surname> <given-names>R</given-names></name> <name><surname>Clot</surname> <given-names>J</given-names></name></person-group>. <article-title>Polymorphism in the regulatory region of HLA-DRB genes correlating with haplotype evolution</article-title>. <source>Immunogenetics</source> (<year>1993</year>) <volume>38</volume>:<fpage>21</fpage>&#x02013;<lpage>6</lpage>. <pub-id pub-id-type="pmid">8462990</pub-id></citation></ref>
<ref id="B46">
<label>46.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kusano</surname> <given-names>S</given-names></name> <name><surname>Kukimoto-Niino</surname> <given-names>M</given-names></name> <name><surname>Satta</surname> <given-names>Y</given-names></name> <name><surname>Ohsawa</surname> <given-names>N</given-names></name> <name><surname>Uchikubo-Kamo</surname> <given-names>T</given-names></name> <name><surname>Wakiyama</surname> <given-names>M</given-names></name> <etal/></person-group>. <article-title>Structural basis for the specific recognition of the major antigenic peptide from the Japanese cedar pollen allergen Cry j 1 by HLA-DP5</article-title>. <source>J Mol Biol.</source> (<year>2014</year>) <volume>426</volume>:<fpage>3016</fpage>&#x02013;<lpage>27</lpage>. <pub-id pub-id-type="doi">10.1016/j.jmb.2014.06.020</pub-id><pub-id pub-id-type="pmid">25020231</pub-id></citation></ref>
<ref id="B47">
<label>47.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Oka</surname> <given-names>S</given-names></name> <name><surname>Furukawa</surname> <given-names>H</given-names></name> <name><surname>Kawasaki</surname> <given-names>A</given-names></name> <name><surname>Shimada</surname> <given-names>K</given-names></name> <name><surname>Sugii</surname> <given-names>S</given-names></name> <name><surname>Hashimoto</surname> <given-names>A</given-names></name> <etal/></person-group>. <article-title>Protective effect of the HLA-DRB1<sup>&#x0002A;</sup>13:02 allele in Japanese rheumatoid arthritis patients</article-title>. <source>PloS One</source> (<year>2014</year>) <volume>9</volume>:<fpage>e99453</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0099453</pub-id><pub-id pub-id-type="pmid">24911054</pub-id></citation></ref>
<ref id="B48">
<label>48.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>van der</surname> <given-names>Horst-Bruinsma IE</given-names></name> <name><surname>Visser</surname> <given-names>H</given-names></name> <name><surname>Hazes</surname> <given-names>JM</given-names></name> <name><surname>Breedveld</surname> <given-names>FC</given-names></name> <name><surname>Verduyn</surname> <given-names>W</given-names></name> <name><surname>Schreuder</surname> <given-names>GM</given-names></name> <etal/></person-group>. <article-title>HLA-DQ-associated predisposition to and dominant HLA-DR-associated protection against rheumatoid arthritis</article-title>. <source>Hum Immunol.</source> (<year>1999</year>) <volume>60</volume>:<fpage>152</fpage>&#x02013;<lpage>8</lpage>.</citation></ref>
<ref id="B49">
<label>49.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mattey</surname> <given-names>DL</given-names></name> <name><surname>Dawes</surname> <given-names>PT</given-names></name> <name><surname>Gonzalez-Gay</surname> <given-names>MA</given-names></name> <name><surname>Garcia-Porrua</surname> <given-names>C</given-names></name> <name><surname>Thomson</surname> <given-names>W</given-names></name> <name><surname>Hajeer</surname> <given-names>AH</given-names></name> <etal/></person-group>. <article-title>HLA-DRB1 alleles encoding an aspartic acid at position 70 protect against development of rheumatoid arthritis</article-title>. <source>J Rheumatol.</source> (<year>2001</year>) <volume>28</volume>:<fpage>232</fpage>&#x02013;<lpage>9</lpage>. <pub-id pub-id-type="doi">10.1016/j.humimm.2003.12.009</pub-id><pub-id pub-id-type="pmid">11246655</pub-id></citation></ref>
<ref id="B50">
<label>50.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gourraud</surname> <given-names>PA</given-names></name> <name><surname>Dieude</surname> <given-names>P</given-names></name> <name><surname>Boyer</surname> <given-names>JF</given-names></name> <name><surname>Nogueira</surname> <given-names>L</given-names></name> <name><surname>Cambon-Thomsen</surname> <given-names>A</given-names></name> <name><surname>Mazieres</surname> <given-names>B</given-names></name> <etal/></person-group>. <article-title>A new classification of HLA-DRB1 alleles differentiates predisposing and protective alleles for autoantibody production in rheumatoid arthritis</article-title>. <source>Arthritis Res Ther.</source> (<year>2007</year>) <volume>9</volume>:<fpage>R27</fpage>. <pub-id pub-id-type="doi">10.1186/ar2131</pub-id><pub-id pub-id-type="pmid">17328818</pub-id></citation></ref>
<ref id="B51">
<label>51.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mewar</surname> <given-names>D</given-names></name> <name><surname>Marinou</surname> <given-names>I</given-names></name> <name><surname>Coote</surname> <given-names>AL</given-names></name> <name><surname>Moore</surname> <given-names>DJ</given-names></name> <name><surname>Akil</surname> <given-names>M</given-names></name> <name><surname>Smillie</surname> <given-names>D</given-names></name> <etal/></person-group>. <article-title>Association between radiographic severity of rheumatoid arthritis and shared epitope alleles: differing mechanisms of susceptibility and protection</article-title>. <source>Ann Rheum Dis.</source> (<year>2008</year>) <volume>67</volume>:<fpage>980</fpage>&#x02013;<lpage>3</lpage>. <pub-id pub-id-type="doi">10.1136/ard.2007.075382</pub-id><pub-id pub-id-type="pmid">17901090</pub-id></citation></ref>
<ref id="B52">
<label>52.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Turner</surname> <given-names>TR</given-names></name> <name><surname>Hayhurst</surname> <given-names>JD</given-names></name> <name><surname>Hayward</surname> <given-names>DR</given-names></name> <name><surname>Bultitude</surname> <given-names>WP</given-names></name> <name><surname>Barker</surname> <given-names>DJ</given-names></name> <name><surname>Robinson</surname> <given-names>J</given-names></name> <etal/></person-group>. <article-title>Single molecule real-time DNA sequencing of HLA genes at ultra-high resolution from 126 International HLA and Immunogenetics Workshop cell lines</article-title>. <source>Hla</source> (<year>2018</year>) <volume>91</volume>:<fpage>88</fpage>&#x02013;<lpage>101</lpage>. <pub-id pub-id-type="doi">10.1111/tan.13184</pub-id><pub-id pub-id-type="pmid">29171935</pub-id></citation></ref>
<ref id="B53">
<label>53.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Albrecht</surname> <given-names>V</given-names></name> <name><surname>Zweiniger</surname> <given-names>C</given-names></name> <name><surname>Surendranath</surname> <given-names>V</given-names></name> <name><surname>Lang</surname> <given-names>K</given-names></name> <name><surname>Schofl</surname> <given-names>G</given-names></name> <name><surname>Dahl</surname> <given-names>A</given-names></name> <etal/></person-group>. <article-title>Dual redundant sequencing strategy: full-length gene characterisation of 1056 novel and confirmatory HLA alleles</article-title>. <source>Hla</source> (<year>2017</year>) <volume>90</volume>:<fpage>79</fpage>&#x02013;<lpage>87</lpage>. <pub-id pub-id-type="doi">10.1111/tan.13057</pub-id><pub-id pub-id-type="pmid">28547825</pub-id></citation></ref>
<ref id="B54">
<label>54.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chitnis</surname> <given-names>N</given-names></name> <name><surname>Clark</surname> <given-names>PM</given-names></name> <name><surname>Kamoun</surname> <given-names>M</given-names></name> <name><surname>Stolle</surname> <given-names>C</given-names></name> <name><surname>Brad Johnson</surname> <given-names>F</given-names></name> <name><surname>Monos</surname> <given-names>DS</given-names></name></person-group>. <article-title>An expanded role for HLA genes: HLA-B encodes a microRNA that regulates IgA and other immune response transcripts</article-title>. <source>Front Immunol.</source> (<year>2017</year>) <volume>8</volume>:<fpage>583</fpage>. <pub-id pub-id-type="doi">10.3389/fimmu.2017.00583</pub-id><pub-id pub-id-type="pmid">28579988</pub-id></citation></ref>
<ref id="B55">
<label>55.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>van den Elsen</surname> <given-names>PJ</given-names></name></person-group>. <article-title>Expression regulation of major histocompatibility complex class I and class II encoding genes</article-title>. <source>Front Immunol.</source> (<year>2011</year>) <volume>2</volume>:<fpage>48</fpage>. <pub-id pub-id-type="doi">10.3389/fimmu.2011.00048</pub-id><pub-id pub-id-type="pmid">22566838</pub-id></citation></ref>
<ref id="B56">
<label>56.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Castelli</surname> <given-names>EC</given-names></name> <name><surname>Veiga-Castelli</surname> <given-names>LC</given-names></name> <name><surname>Yaghi</surname> <given-names>L</given-names></name> <name><surname>Moreau</surname> <given-names>P</given-names></name> <name><surname>Donadi</surname> <given-names>EA</given-names></name></person-group>. <article-title>Transcriptional and posttranscriptional regulations of the HLA-G gene</article-title>. <source>J Immunol Res.</source> (<year>2014</year>) <volume>2014</volume>:<fpage>734068</fpage>. <pub-id pub-id-type="doi">10.1155/2014/734068</pub-id><pub-id pub-id-type="pmid">24741620</pub-id></citation></ref>
<ref id="B57">
<label>57.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Moolhuijzen</surname> <given-names>P</given-names></name> <name><surname>Kulski</surname> <given-names>JK</given-names></name> <name><surname>Dunn</surname> <given-names>DS</given-names></name> <name><surname>Schibeci</surname> <given-names>D</given-names></name> <name><surname>Barrero</surname> <given-names>R</given-names></name> <name><surname>Gojobori</surname> <given-names>T</given-names></name> <etal/></person-group>. <article-title>The transcript repeat element: the human Alu sequence as a component of gene networks influencing cancer</article-title>. <source>Funct Integr Genomics</source> (<year>2010</year>) <volume>10</volume>:<fpage>307</fpage>&#x02013;<lpage>19</lpage>. <pub-id pub-id-type="doi">10.1007/s10142-010-0168-1</pub-id><pub-id pub-id-type="pmid">20393868</pub-id></citation></ref>
<ref id="B58">
<label>58.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chuong</surname> <given-names>EB</given-names></name> <name><surname>Elde</surname> <given-names>NC</given-names></name> <name><surname>Feschotte</surname> <given-names>C</given-names></name></person-group>. <article-title>Regulatory activities of transposable elements: from conflicts to benefits</article-title>. <source>Nat Rev Genet.</source> (<year>2017</year>) <volume>18</volume>:<fpage>71</fpage>&#x02013;<lpage>86</lpage>. <pub-id pub-id-type="doi">10.1038/nrg.2016.139</pub-id><pub-id pub-id-type="pmid">27867194</pub-id></citation></ref>
<ref id="B59">
<label>59.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zino</surname> <given-names>E</given-names></name> <name><surname>Frumento</surname> <given-names>G</given-names></name> <name><surname>Marktel</surname> <given-names>S</given-names></name> <name><surname>Sormani</surname> <given-names>MP</given-names></name> <name><surname>Ficara</surname> <given-names>F</given-names></name> <name><surname>Di Terlizzi</surname> <given-names>S</given-names></name> <etal/></person-group>. <article-title>A T-cell epitope encoded by a subset of HLA-DPB1 alleles determines nonpermissive mismatches for hematologic stem cell transplantation</article-title>. <source>Blood</source> (<year>2004</year>) <volume>103</volume>:<fpage>1417</fpage>&#x02013;<lpage>24</lpage>. <pub-id pub-id-type="doi">10.1182/blood-2003-04-1279</pub-id><pub-id pub-id-type="pmid">14576061</pub-id></citation></ref>
<ref id="B60">
<label>60.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Morishima</surname> <given-names>S</given-names></name> <name><surname>Shiina</surname> <given-names>T</given-names></name> <name><surname>Suzuki</surname> <given-names>S</given-names></name> <name><surname>Ogawa</surname> <given-names>S</given-names></name> <name><surname>Sato-Otsubo</surname> <given-names>A</given-names></name> <name><surname>Kashiwase</surname> <given-names>K</given-names></name> <etal/></person-group>. <article-title>Evolutionary basis of HLA-DPB1 alleles affects acute GVHD in unrelated donor stem cell transplantation</article-title>. <source>Blood</source> (<year>2018</year>) <volume>131</volume>:<fpage>808</fpage>&#x02013;<lpage>17</lpage>. <pub-id pub-id-type="doi">10.1182/blood-2017-08-801449</pub-id><pub-id pub-id-type="pmid">29246901</pub-id></citation></ref>
<ref id="B61">
<label>61.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dunn</surname> <given-names>DS</given-names></name> <name><surname>Inoko</surname> <given-names>H</given-names></name> <name><surname>Kulski</surname> <given-names>JK</given-names></name></person-group>. <article-title>The association between non-melanoma skin cancer and a young dimorphic Alu element within the major histocompatibility complex class I genomic region</article-title>. <source>Tissue Antigens</source> (<year>2006</year>) <volume>68</volume>:<fpage>127</fpage>&#x02013;<lpage>34</lpage>. <pub-id pub-id-type="doi">10.1111/j.1399-0039.2006.00631.x</pub-id><pub-id pub-id-type="pmid">16866882</pub-id></citation></ref>
</ref-list>
<glossary>
<def-list>
<title>Abbreviations</title>
<def-item><term>MHC</term>
<def><p>Major histocompatibility complex</p></def></def-item>
<def-item><term>HLA</term>
<def><p>Human leukocyte antigen</p></def></def-item>
<def-item><term>GVHD</term>
<def><p>Graft-versus-host disease</p></def></def-item>
<def-item><term>PCR</term>
<def><p>Polymerase chain reaction</p></def></def-item>
<def-item><term>RFLP</term>
<def><p>Restriction fragment polymorphisms</p></def></def-item>
<def-item><term>SSCP</term>
<def><p>Single strand conformation polymorphism</p></def></def-item>
<def-item><term>SSO</term>
<def><p>Sequence specific oligonucleotides</p></def></def-item>
<def-item><term>SSP</term>
<def><p>Sequence specific primers</p></def></def-item>
<def-item><term>SBT</term>
<def><p>Sequence based typing</p></def></def-item>
<def-item><term>UTR</term>
<def><p>Untranslated region</p></def></def-item>
<def-item><term>NGS</term>
<def><p>Next generation sequencing</p></def></def-item>
<def-item><term>SS-SBT</term>
<def><p>Super high resolution-single molecule-sequence-based typing</p></def></def-item>
<def-item><term>SNP</term>
<def><p>Single nucleotide polymorphism</p></def></def-item>
<def-item><term>SNV</term>
<def><p>Single nucleotide variation</p></def></def-item>
<def-item><term>SMRT</term>
<def><p>Single molecule, real-time</p></def></def-item>
<def-item><term>Indel</term>
<def><p>Insertion and deletion</p></def></def-item>
<def-item><term>RA</term>
<def><p>Rheumatoid arthritis</p></def></def-item>
<def-item><term>LAA</term>
<def><p>Long Amplicon Analysis</p></def></def-item>
<def-item><term>SD</term>
<def><p>Standard deviation</p></def></def-item>
<def-item><term>CDS</term>
<def><p>Coding sequence</p></def></def-item>
<def-item><term>SINE</term>
<def><p>Short interspersed nuclear element</p></def></def-item>
<def-item><term>LINE</term>
<def><p>Long interspersed nuclear element</p></def></def-item>
<def-item><term>HIV</term>
<def><p>Human Immunodeficiency Virus</p></def></def-item>
<def-item><term>UR-HCT</term>
<def><p>unrelated hematopoietic cell transplantation</p></def></def-item>
<def-item><term>TCE</term>
<def><p>T-cell epitope</p></def></def-item>
<def-item><term>MER</term>
<def><p>Medium reiterated repeat</p></def></def-item>
<def-item><term>LTR</term>
<def><p>Long terminal repeat</p></def></def-item>
<def-item><term>SNR</term>
<def><p>noise ratio</p></def></def-item>
<def-item><term>emPCR</term>
<def><p>Emulsion PCR</p></def></def-item>
<def-item><term>Blat</term>
<def><p>BLAST-like alignment tool</p></def></def-item>
<def-item><term>QV</term>
<def><p>quality value</p></def></def-item>
<def-item><term>SeaBass</term>
<def><p>Sequence Alignment Based Assigning Software.</p></def></def-item>
</def-list>
</glossary>
<fn-group>
<fn fn-type="financial-disclosure"><p><bold>Funding.</bold> This work was supported by MEXT KAKENHI (No. 16H06502), and by the Practical Research Project for Allergic Diseases and Immunology (Research on Technology of Medical Transplantation) from the Japan Agency for Medical Research and Development (Nos. 15ek0510002h0202 and 17ek0510022s0301) and 2015 and 2016 Tokai University School of Medicine Research Aid.</p>
</fn>
</fn-group>
</back>
</article>