<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Immunol.</journal-id>
<journal-title>Frontiers in Immunology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Immunol.</abbrev-journal-title>
<issn pub-type="epub">1664-3224</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fimmu.2025.1603730</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Immunology</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Large-scale statistical mapping of T-cell receptor <italic>&#x3b2;</italic> sequences to human leukocyte antigens</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Zahid</surname>
<given-names>H. Jabran</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2844730/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Taniguchi</surname>
<given-names>Ruth</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Ebert</surname>
<given-names>Peter</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="author-notes" rid="fn003">
<sup>&#x2020;</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Chow</surname>
<given-names>I-Ting</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Gooley</surname>
<given-names>Chris</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Lv</surname>
<given-names>Jinpeng</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Pisani</surname>
<given-names>Lorenzo</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Rusnak</surname>
<given-names>Mikaela</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Elyanow</surname>
<given-names>Rebecca</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Takamatsu</surname>
<given-names>Hiroyuki</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Zhou</surname>
<given-names>Wenyu</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Greissl</surname>
<given-names>Julia</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Robins</surname>
<given-names>Harlan</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Carlson</surname>
<given-names>Jonathan M.</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Microsoft Research</institution>, <addr-line>Redmond, WA</addr-line>, <country>United States</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Adaptive Biotechnologies</institution>, <addr-line>Seattle, WA</addr-line>, <country>United States</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Faculty of Transdisciplinary Sciences for Innovation, Institute of Transdisciplinary Sciences for Innovation/Department of Hematology, Kanazawa University</institution>, <addr-line>Kanazawa</addr-line>,&#xa0;<country>Japan</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>Edited by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/24021/overview">Jonathan S Duke-Cohan</ext-link>, Dana&#x2013;Farber Cancer Institute, United States</p>
</fn>
<fn fn-type="edited-by">
<p>Reviewed by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/891160/overview">Eun Young Choi</ext-link>, Seoul National University, Republic of Korea</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1490265/overview">Santrupti Nerli</ext-link>, Genentech, United States</p>
</fn>
<fn fn-type="corresp" id="fn001">
<p>*Correspondence: H. Jabran Zahid, <email xlink:href="mailto:hzahid@microsoft.com">hzahid@microsoft.com</email>; Harlan Robins, <email xlink:href="mailto:hrobins@adaptivebiotech.com">hrobins@adaptivebiotech.com</email>; Jonathan M. Carlson, <email xlink:href="mailto:carlson@microsoft.com">carlson@microsoft.com</email>
</p>
</fn>
<fn fn-type="deceased" id="fn003">
<p>&#x2020;Deceased</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>27</day>
<month>08</month>
<year>2025</year>
</pub-date>
<pub-date pub-type="collection">
<year>2025</year>
</pub-date>
<volume>16</volume>
<elocation-id>1603730</elocation-id>
<history>
<date date-type="received">
<day>31</day>
<month>03</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>31</day>
<month>07</month>
<year>2025</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2025 Zahid, Taniguchi, Ebert, Chow, Gooley, Lv, Pisani, Rusnak, Elyanow, Takamatsu, Zhou, Greissl, Robins and Carlson.</copyright-statement>
<copyright-year>2025</copyright-year>
<copyright-holder>Zahid, Taniguchi, Ebert, Chow, Gooley, Lv, Pisani, Rusnak, Elyanow, Takamatsu, Zhou, Greissl, Robins and Carlson</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<sec>
<title>Introduction</title>
<p>T-cell receptors (TCRs) interacting with peptides presented by human leukocyte antigens (HLAs) are the foundation of the adaptive immune system, but population-level analysis of TCR&#x2013;HLA interactions is lacking.</p>
</sec>
<sec>
<title>Methods</title>
<p>We statistically associated approximately 10<sup>6</sup> public TCR&#x3b2;s to specific HLAs using TCR&#x3b2; repertoires sampled from 4,144 HLA-genotyped subjects. The TCR&#x3b2;s we associated were specific to unique HLA allotypes, not allelic groups, and to the paired &#x3b1;&#x2013;&#x3b2; heterodimer of class II HLAs, though exceptions were observed.</p>
</sec>
<sec>
<title>Results</title>
<p>This specificity permitted highly accurate imputation of 248 class I and II HLAs from the TCR&#x3b2; repertoire. Notably, 45 HLA-DP and -DQ heterodimers lacked associated TCRs because they likely arise from non-functional trans-complementation. The public class I and II HLA-associated TCR&#x3b2;s we identified were primarily expressed on CD8<sup>+</sup> and CD4<sup>+</sup> memory T cells, respectively, which were responding to various common antigens.</p>
</sec>
<sec>
<title>Discussion</title>
<p>Our results recapitulate fundamental biology, provide insights into the functionality of HLAs, and demonstrate the power and potential of population-level TCR&#x3b2; repertoire sequencing.</p>
</sec>
</abstract>
<kwd-group>
<kwd>human leukocyte antigen</kwd>
<kwd>T cell</kwd>
<kwd>immunology</kwd>
<kwd>T cell - HLA interaction</kwd>
<kwd>T cell repertoire</kwd>
</kwd-group>
<counts>
<fig-count count="7"/>
<table-count count="3"/>
<equation-count count="2"/>
<ref-count count="75"/>
<page-count count="24"/>
<word-count count="13788"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-in-acceptance</meta-name>
<meta-value>T Cell Biology</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<title>Introduction</title>
<p>The major histocompatibility complex (MHC) is a set of genes found in jawed vertebrates, which in humans encode for human leukocyte antigens (HLAs) (<xref ref-type="bibr" rid="B1">1</xref>). The primary function of HLAs is to present fragments of proteins (i.e., peptides or antigens) on the surface of cells for T cell recognition (<xref ref-type="bibr" rid="B2">2</xref>). TCRs on the surface of T cells interact with the peptides presented by HLAs (pHLA). The TCR-pHLA interaction is a key mechanism of adaptive immunity and plays a central role in the immune system&#x2019;s response to infections, cancers, allergens and self-tissues targeted in autoimmunity and transplantation (<xref ref-type="bibr" rid="B3">3</xref>&#x2013;<xref ref-type="bibr" rid="B10">10</xref>).</p>
<p>HLAs are both polygenic and polymorphic, allowing for a highly specific and fine-tuned adaptive immune response to diverse pathogens. The classical antigen-presenting MHC proteins&#x2014;class I and class II HLAs&#x2014;are found on the surface of all nucleated and professional antigen presenting cells, respectively. A large number of allelic variants have been identified across the six loci encoding class I (HLA-A, -B and -C) and class II (HLA-DP, -DQ and -DR) HLAs (<xref ref-type="bibr" rid="B11">11</xref>). Antigens presented to T cells bind to a single polymorphic <italic>&#x3b1;</italic> chain of class I HLAs (<xref ref-type="bibr" rid="B12">12</xref>, <xref ref-type="bibr" rid="B13">13</xref>) and to the <italic>&#x3b1;</italic> and <italic>&#x3b2;</italic> chain of class II HLAs (<xref ref-type="bibr" rid="B14">14</xref>&#x2013;<xref ref-type="bibr" rid="B16">16</xref>). Both the <italic>&#x3b1;</italic> and <italic>&#x3b2;</italic> chains are polymorphic for HLA-DPand -DQ whereas only the <italic>&#x3b2;</italic> chain is polymorphic for -DR. Furthermore, the <italic>&#x3b2;</italic> chain of HLA-DR may be encoded by four loci (<italic>DRB1</italic>, <italic>DRB3</italic>, <italic>DRB4</italic> and <italic>DRB5</italic>); all individuals have <italic>DRB1</italic> encoded on both instances of chromosome 6 and may additionally have one of <italic>DRB3</italic>, <italic>DRB4</italic> or <italic>DRB5</italic> on each chromosome 6.</p>
<p>HLA genes can be resolved to varying degrees by sequencing and several distinct naming systems can be found in the literature. Here we adopt the 2010 WHO HLA nomenclature (<xref ref-type="bibr" rid="B17">17</xref>). For each locus, the first two fields designate the allele group and specific protein (i.e. allotype), respectively. The third and fourth fields indicate synonymous substitutions in coding and non-coding regions, respectively. For class II HLAs, the <italic>&#x3b1;</italic> and <italic>&#x3b2;</italic> chains are encoded, sequenced and typed independently. Our sequencing of HLAs lacks information on parental haplotype (i.e., phasing). In the context of molecular epidemiology, identifying (or assuming) the resolution at which causal mechanisms (and thus, clinical associations) are likely operating remains challenging. HLAs in the same allelic group tend to present similar or identical peptides (<xref ref-type="bibr" rid="B18">18</xref>), share functional properties such as relative expression levels (<xref ref-type="bibr" rid="B19">19</xref>, <xref ref-type="bibr" rid="B20">20</xref>), and serve as ligands for the same KIR receptors (<xref ref-type="bibr" rid="B21">21</xref>). Thus, many epidemiological and functional studies treat HLAs of the same allelic group interchangeably. However, structural (<xref ref-type="bibr" rid="B22">22</xref>), functional (<xref ref-type="bibr" rid="B23">23</xref>), and evolutionary evidence (<xref ref-type="bibr" rid="B24">24</xref>) suggest that, atleast in some contexts, very similar HLA allotypes frequently interact with very different TCRs. A fundamental goal of this work is to establish the relationship between TCR specificity and HLA resolution and to explore the TCR specificity of class I andclass II HLAs.</p>
<p>The human body maintains a diverse set of naive T cells where antigen specificity is determined by TCRs (<xref ref-type="bibr" rid="B25">25</xref>, <xref ref-type="bibr" rid="B26">26</xref>). These T cells are selected such that their TCRs, which are generated via V(D)J recombination, interact with pHLAs in the thymus (<xref ref-type="bibr" rid="B27">27</xref>&#x2013;<xref ref-type="bibr" rid="B30">30</xref>). Interaction with class I and class II pHLAs directs differentiation into CD8<sup>+</sup> (cytotoxic T cell) (<xref ref-type="bibr" rid="B31">31</xref>, <xref ref-type="bibr" rid="B32">32</xref>) and CD4<sup>+</sup> (helper T cell) lineages (<xref ref-type="bibr" rid="B33">33</xref>), respectively. Antigen presentation by an HLA and subsequent TCR recognition in the appropriate immunological context triggers clonal expansion of naive T cells resulting in a large population of T cells expressing identical cognate TCRs (<xref ref-type="bibr" rid="B34">34</xref>). Clonal expansion of T cells with the same TCR greatly increases the chance of sampling these TCRs experimentally. As a result, subjects with matching HLAs and shared antigenic exposure have a significantly higher likelihood of sharing subsets of TCRscompared to subjects with differing HLAs and/or antigenic exposure history (<xref ref-type="bibr" rid="B35">35</xref>&#x2013;<xref ref-type="bibr" rid="B38">38</xref>). Here we leverage this aspect of T-cell biology to identify sets of public TCR<italic>&#x3b2;</italic>s that are over-represented in subjects sharing HLAs. We expect these sets to be enriched for HLA-restricted TCR<italic>&#x3b2;</italic>s specific to common antigens and we use them to probe the functional nature of HLAs.</p>
<p>The T-cell repertoire is a rich source of information for understanding adaptive immunity (<xref ref-type="bibr" rid="B39">39</xref>, <xref ref-type="bibr" rid="B40">40</xref>). The vast majority of TCRs are heterodimers composed of an <italic>&#x3b1;</italic> and <italic>&#x3b2;</italic> chain which together encode pHLA specificity. Our data consists of T-cell repertoires of TCR<italic>&#x3b2;</italic> sequences; the paired <italic>&#x3b1;</italic> chain is unknown. While any given TCR<italic>&#x3b2;</italic> chain may randomly pair with many <italic>&#x3b1;</italic> chains, the memory T cell compartment appears to be dominated by <italic>&#x3b2;</italic> chains that pair with a single <italic>&#x3b1;</italic> chain (<xref ref-type="bibr" rid="B41">41</xref>). This observation results from the fact that TCR-pHLA binding only occurs with very specific TCR<italic>&#x3b1;&#x3b2;</italic> combinations and these specific TCRs are significantly more likely to be sampled in a repertoire due to clonal expansion driven by antigen recognition. Furthermore, if the response is to a common antigen, the TCR<italic>&#x3b2;</italic> may be observed in multiple subjects (<xref ref-type="bibr" rid="B35">35</xref>, <xref ref-type="bibr" rid="B37">37</xref>).</p>
<p>Given that memory T cells undergo strong clonal selection for specific TCR<italic>&#x3b1;&#x3b2;</italic> pairs and that some TCRs recur across individuals who share both HLA alleles and exposure history, we hypothesize that public TCR<italic>&#x3b2;</italic>s associated with specific HLAs are memory T cells targeting the same antigens presented by multiple individuals who share the appropriate restricting HLAs and pathogenic exposure history. While TCRs are inherently cross-reactive and capable of recognizing many distinct pMHCs (<xref ref-type="bibr" rid="B42">42</xref>), any given individual encounters only a small subset of the total antigenic space. Moreover, only a fraction of exposures are sufficiently common to elicit reproducible, public TCR responses across individuals. We will show consistent associations between specific TCR<italic>&#x3b2;</italic>s and HLAs, reflecting both underlying biological specificity and the ability of our approach to identify reproducible, public signals. These associations suggest that the <italic>&#x3b2;</italic> chains are typically paired with compatible&#x2014;albeit unknown&#x2014;<italic>&#x3b1;</italic> chains that preserve specificity to the same pHLAs. Thus, we will demonstrate that for the public TCR<italic>&#x3b2;</italic> sequences that we statistically associate with specific HLAs, shared pHLA specificity can be inferred from TCR<italic>&#x3b2;</italic> alone. Recent independent work has also explored statistical associations between TCRs and HLA genotypes using public repertoire data (<xref ref-type="bibr" rid="B43">43</xref>, <xref ref-type="bibr" rid="B44">44</xref>), further supporting the value of population-scale immunosequencing.</p>
<p>Here we use high-throughput genetic sequencing (<xref ref-type="bibr" rid="B45">45</xref>, <xref ref-type="bibr" rid="B46">46</xref>) of the T-cell repertoires of 4,144 subjects with HLA genotypes measured from direct-sequencing to identify ~ 10<sup>6</sup> public TCR<italic>&#x3b2;</italic>s that are statistically associated with HLA allotypes. While observing any given TCR<italic>&#x3b2;</italic> in a repertoire may be rare, the TCR<italic>&#x3b2;</italic> repertoire of an individual expressing a given HLA will almost always contain many TCR<italic>&#x3b2;</italic>s that we associate with that HLA. The TCR<italic>&#x3b2;</italic>s we associate to HLAs provide a new window into understanding the interaction between TCR and HLAs. The public nature of these TCR<italic>&#x3b2;</italic>s and their robust HLA associations permit highly accurate imputation of class I and II HLA allotypes solely from TCR<italic>&#x3b2;</italic> repertoires allowing us to probe functional characteristics of HLAs with respect to their TCR<italic>&#x3b2;</italic> interactions.</p>
</sec>
<sec id="s2" sec-type="results">
<title>Results</title>
<sec id="s2_1">
<title>Identification of HLA-associated TCR<italic>&#x3b2;s</italic>
</title>
<p>Our data consist of the sequenced T-cell repertoires of 4,144 subjects with HLAs genotyped via next generation sequencing (NGS) (<xref ref-type="bibr" rid="B47">47</xref>) (see <xref ref-type="supplementary-material" rid="SF1">
<bold>Supplementary Figure S1</bold>
</xref> for demographic distributions). The median number of unique T cells sequenced from each individual is ~ 227,000 and 90% of subjects have counts between ~ 74,000 and ~ 610,000. The majority of our samples are taken from healthy adults residing in the United States; ~ 5% and ~ 20% are Lyme and Covid positive, respectively. For a given HLA, we separate subjects into cases and controls defined as those with and without the HLA, respectively. Subjects expressing an HLA that is in the same p-group<xref ref-type="fn" rid="fn1">
<sup>1</sup>
</xref> as the HLA of interest are excluded from the control group, as such HLAs have identical amino acid sequences in the peptide binding region and thus may share TCR specificity. HLA-DP and -DQ are treated as heterodimers, with cases and controls defined by <italic>&#x3b1;</italic>-<italic>&#x3b2;</italic> pairs. The <italic>&#x3b1;</italic> chain of HLA-DR is invariant and thus we treat these HLAs as monomers, similar to class I HLAs. We randomly select a fixed 80% and 20% of the samples for training and validation, respectively, and evaluate model generalization on an entirely independent cohort from Kanazawa, Japan.</p>
<p>We identify sets of public HLA-associated TCR<italic>&#x3b2;</italic>s using a statistical approach that enforces the assumption that any TCR<italic>&#x3b2;</italic> is associated with at most one HLA allotype (we test this assumption below). This assumption enables us to disentangle the effects of linkage disequilibrium (LD) among HLA loci (<xref ref-type="bibr" rid="B48">48</xref>) that would otherwise result in a large number of spurious HLA-TCR associations (<xref ref-type="supplementary-material" rid="SF2">
<bold>Supplementary Figure S2A</bold>
</xref>). We use exact matching of the TCR<italic>&#x3b2;</italic> V-gene, J-gene and CDR3 to identify sequences thatare over-represented in subjects with a given HLA allotype. Thus, our association of TCR<italic>&#x3b2;</italic>s with HLAs is agnostic to the specific amino acid sequence, it solely relies on it being observed in multiple repertoires.</p>
<p>Our assumption that TCRs typically associate with a single HLA allotype is important for resolving LD but is also supported by current biological evidence. While TCRs may be theoretically capable of broad cross-reactivity (<xref ref-type="bibr" rid="B42">42</xref>), there is limited experimental evidence that public TCRs functionally recognize multiple unrelated pHLAs. Rather, evidence suggests that functional cross-reactivity may be rare, with TCRs typically exhibiting specificity for particular epitopes and HLAs (<xref ref-type="bibr" rid="B49">49</xref>&#x2013;<xref ref-type="bibr" rid="B51">51</xref>). Nonetheless, the true extent of functional cross-reactivity in physiologically relevant settings remains an open question. Our sequence identification procedure is primarily powered to detect public TCR<italic>&#x3b2;</italic>s associated with a single HLA and has limited sensitivity to detect sequences with broad cross-reactivity, if such sequences exist.</p>
<p>The identification procedure works as follows (see Methods for precise details): for each HLA allotype, we first create a set of candidate HLA-associated TCR<italic>&#x3b2;</italic>s using a one-sided Fisher&#x2019;s Exact Test (FET) to identify TCR<italic>&#x3b2;</italic>s over-represented in cases. We adopt a pre-specified fiducial p-value threshold, <italic>p</italic>
<sup>*</sup>. For each unique candidate TCR<italic>&#x3b2;</italic>, we fit an L1-regularized Logistic Regression (L1LR) model which predicts the presence of that TCR<italic>&#x3b2;</italic> in subjects given their HLAs (represented as abinary vector of indicator variables). We tune the L1 hyperparameter <italic>&#x3bb;</italic> to be the smallest value for which exactly one HLA parameter is non-zero. In other words, we determine which single HLA allotype best predicts the observed distribution of a given TCR<italic>&#x3b2;</italic> in the repertoires of our training sample. We test all TCR<italic>&#x3b2;</italic>s with p-values &lt; <italic>p</italic>
<sup>*</sup> and retain only TCR<italic>&#x3b2;</italic>s which associate most strongly with the HLA being modeled. As our interest here is primarily in the characteristics of titsets of HLA-associated TCR<italic>&#x3b2;</italic>s, we set <italic>p</italic>
<sup>*</sup> to a permissive value of <italic>p</italic>
<sup>*</sup> = 10<sup>-4</sup> and use the hold-out repertoires for validation. Note that due to exclusion of p-group matched HLAs a small number of TCR<italic>&#x3b2;</italic>s are assigned to multiple HLAs due to variations in the training data (<xref ref-type="supplementary-material" rid="SF2">
<bold>Supplementary Figure S2B</bold>
</xref>).</p>
<p>We associate ~ 10<sup>6</sup> TCR<italic>&#x3b2;</italic>s to specific HLAs, for a median of 2,400 TCR<italic>&#x3b2;</italic>s per HLA with ~ 70% of HLAs having a total number of associated TCR<italic>&#x3b2;</italic>s in the range of 1,600-5,000. To maintain consistency with other work associating TCR<italic>&#x3b2;</italic>s with disease (<xref ref-type="bibr" rid="B37">37</xref>, <xref ref-type="bibr" rid="B38">38</xref>, <xref ref-type="bibr" rid="B52">52</xref>, <xref ref-type="bibr" rid="B53">53</xref>), we refer to these HLA-associated TCR<italic>&#x3b2;</italic>s as e<italic>nhanced sequences</italic> (ES).</p>
</sec>
<sec id="s2_2">
<title>TCR specificity</title>
<sec id="s2_2_1">
<title>Most enhanced sequences are specific to HLA allotypes</title>
<p>To validate the HLA allotype specificity of ESs, we compare their abundance in HLA cases as compared to controls in our holdout set (see <xref ref-type="fig" rid="f1">
<bold>Figures&#xa0;1A, B</bold>
</xref>). Overall, we find clear separation of cases and controls in the holdout data across all functional HLAs (<xref ref-type="supplementary-material" rid="SF3">
<bold>Supplementary Figure S3</bold>
</xref>-<xref ref-type="supplementary-material" rid="SF8">
<bold>S8</bold>
</xref>), highlighting the specificity of these ESs at the HLA allotype level and to the heterodimer for class II HLAs. However, there are notable exceptions.</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>TCR<italic>&#x3b2;</italic> specificity and apparent TCR<italic>&#x3b2;</italic> sharing between some HLA allotypes. ESs for A*02:01 discriminate cases and controls in <bold>(A)</bold> train and <bold>(B)</bold> holdout samples. <bold>(C)</bold> A*23:01 ES counts observed in each sample as a function of sequencing depth. A*23:01 negative, A*23:17 positive subjects have counts consistent with A*23:01 positive subjects and vice-versa in <bold>(D)</bold>. A*23:01 and A*23:17 appear to share the same TCR<italic>&#x3b2;</italic> specificity. <bold>(E)</bold> B*44:02 ES counts observed in each sample as afunction of sequencing depth. ESs discriminate B*44:02 positive subjects from B*44:02 negative subjects. However, B*44:03 and B*44:05 positive subjects (green dots) have elevated counts as compared to controls (blue dots). <bold>(F)</bold> ES counts plotted against sequencing depth for the subset of ESs which associate more strongly with the B*44 group as compared to B*44:02 allotype (identified using the L1LR association method). The subset of ESs in <bold>(F)</bold> elevate all B*44 positive subjects equally suggesting the TCR<italic>&#x3b2;</italic>s in this ES subset are specific to the three allotypes in the group. <bold>(G)</bold> ES counts plotted against sequencing depth for the subset of ESs which associate only to B*44:02, i.e., this set excludes the ESs shown in <bold>(F)</bold>. ESs plotted in <bold>(G)</bold> clearly separate B*44:02 positive subjects from B*44:02 negative subjects, including other allotypes in the B*44 group.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fimmu-16-1603730-g001.tif">
<alt-text content-type="machine-generated">Seven scatter plots showing relationships between total unique rearrangements and enhanced sequence count. Panels A and B compare train and holdout groups by controls and cases. Panels C and D analyze different A alleles, and panels E, F, and G analyze B alleles. Each plot displays a positive trend, with specific allele groupings marked by color-coded dots.</alt-text>
</graphic>
</fig>
<p>We identify one HLA class I allotype pair (<xref ref-type="fig" rid="f1">
<bold>Figures&#xa0;1A, B</bold>
</xref>) and 11 class II pairs (<xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>) that appear to completely share TCR<italic>&#x3b2;s</italic> despite differing in their two-field designation. We refer to these as &#x201c;degenerate&#x201d; HLAs. For each of these degenerate pairs, ESs specific to one HLA are equally distributed among individuals expressing either HLA (<xref ref-type="fig" rid="f1">
<bold>Figures&#xa0;1C, D</bold>
</xref>). Ten of the twelve degenerate HLAs we identify have amino acid differences in a single position not in the peptide presentation and TCR binding domain and thus are in the same p-group.</p>
<table-wrap id="T1" position="float">
<label>Table&#xa0;1</label>
<caption>
<p>List of degenerate HLAs.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="left">Reported</th>
<th valign="middle" align="left">Degenerate</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="left">A*23:01</td>
<td valign="middle" align="left">A*23:17</td>
</tr>
<tr>
<td valign="middle" align="left">DPA1*01:03+DPB1*03:01</td>
<td valign="middle" align="left">DPA1*01:03+DPB1*104:01</td>
</tr>
<tr>
<td valign="middle" align="left">DPA1*02:01+DPB1*17:01</td>
<td valign="middle" align="left">DPA1*02:01+DPB1*131:01</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*02:01+DQB1*02:02</td>
<td valign="middle" align="left">DQA1*02:01+DQB1*02:01</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*03:03+DQB1*03:01</td>
<td valign="middle" align="left">DQA1*03:01+DQB1*03:01</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*03:01+DQB1*03:02</td>
<td valign="middle" align="left">DQA1*03:03+DQB1*03:02</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*03:03+DQB1*02:02</td>
<td valign="middle" align="left">DQA1*03:03+DQB1*02:01</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*05:05+DQB1*03:01</td>
<td valign="middle" align="left">DQA1*05:01+DQB1*03:01,</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*05:05+DQB1*03:01</td>
<td valign="middle" align="left">DQA1*05:05+DQB1*03:19</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*05:01+DQB1*02:01</td>
<td valign="middle" align="left">DQA1*05:05+DQB1*02:01</td>
</tr>
<tr>
<td valign="middle" align="left">DRB4*01:03</td>
<td valign="middle" align="left">DRB4*01:01</td>
</tr>
<tr>
<td valign="middle" align="left">DRB5*02:02</td>
<td valign="middle" align="left">DRB5*02:21</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>We are unable to distinguish between these sets of HLAs using TCR&#x3b2; based typing as they have identical TCR&#x3b2; specificities. When modeling degenerate HLAs, we only report the most commonly occurring HLA in the set.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>To further validate our assumption that most of these TCR<italic>&#x3b2;</italic>s are specific to HLA allotypes, not allelic groups (with the exception of noted degenerate pairs), we use the L1LR method to assign TCR<italic>&#x3b2;</italic>s to either the allelic group (1-field) or the allotype (2-field). We restrict our analysis to class I HLA groups observed in &gt;200 subjects with the most common allotype representing &lt;70% of subjects. Among the six allelic groups tested, we find five have a negligible fraction (~ 1%) of ES associated to the group (A*30, A*33, A*68, B*15, B*35, C*07), indicating that the majority of HLA-associated TCR<italic>&#x3b2;</italic>s we identify are allotype specific.</p>
<p>We find one HLA group where a subset of TCR<italic>&#x3b2;</italic>s in the ES set appear to be specific to multiple allotypes in the group: B*44. We find that 10% of TCR<italic>&#x3b2;</italic>s originally identified as B*44:03-specific are assigned to the B*44 group (<xref ref-type="fig" rid="f1">
<bold>Figures&#xa0;1E-G</bold>
</xref>; similar conclusions are reached when starting with the less prevalent B*44 allotypes). This set of B*44-specific TCR<italic>&#x3b2;</italic>s segregate all B*44 positive from negative individuals in the holdout (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1F</bold>
</xref>), while the remaining ~ 90% of TCR<italic>&#x3b2;</italic>s originally identified as B*44:03-specific separate B*44:03-expressing individuals from those who express B*44:02 or 44:05 (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1G</bold>
</xref>). These three B*44 allotypes differ in only two amino acids (residue 140 and/or 180), and B*44:02 and 44:03 are known to share a large fraction of their peptide repertoire and some of their TCR repertoire (<xref ref-type="bibr" rid="B54">54</xref>).</p>
<p>Degenerate HLAs that completely share their TCR repertoire typically differ in one amino acid outside the binding domain. Similarly, B*44 has two polymorphic positions outside the binding domain and displays a high degree of sharing. On the other hand, groups in which we observe no TCR<italic>&#x3b2;</italic> sharing tend to have one or more amino acid differences in the binding domain. Thus, the degree of sharing we observe appears to be correlated to the number of differing residues and the position at which the differences occur. Taken together, these results show that many TCR<italic>&#x3b2;</italic>s (indeed, the vast majority of those identified here) are specific to distinct HLA allotypes, regardless of shared peptide repertoire or binding domain similarity. Thus, many characteristics of TCR-pHLA interactions differ among highly related HLA allotypes. As expected, no such specificity was observed among HLA allotypes that differ only in synonymous substitutions (ie, at 3- and 4- digit resolution; <xref ref-type="supplementary-material" rid="SF9">
<bold>Supplementary Figure S9</bold>
</xref>). We note that to mitigate the effects of linkage disequilibrium, our algorithm for identifying ESs assumes TCRs are specific to individual HLA allotypes (see methods). Thus, our methodology is not designed to identify an unbiased set of TCRs specific to multiple HLA allotypes. Ouridentification of a small fraction of ESs with specificity to multiple HLA allotypes warrants a systematic investigation which is beyond the scope of this work.</p>
</sec>
<sec id="s2_2_2">
<title>Most TCRs are specific to class II heterodimers, not subunits</title>
<p>Functional class II HLAs are stable heterodimers with both the <italic>&#x3b1;</italic> and <italic>&#x3b2;</italic> chain contacting the peptide. As such, we expect class II HLA-associated TCRs to be specific to the heterodimer and not the protein subunits (i.e. the <italic>&#x3b1;</italic> or <italic>&#x3b2;</italic> chains individually). To directly test this hypothesis, we use the L1LR method to determine if a TCR<italic>&#x3b2;</italic> is more strongly enriched among individuals expressing both the <italic>&#x3b1;</italic> and <italic>&#x3b2;</italic> chains or individuals expressing only one or the other subunit. Across 37 heterodimers, we find that <inline-formula>
<mml:math display="inline" id="im1">
<mml:mrow>
<mml:mo>&#x223c;</mml:mo>
<mml:mn>146000</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> (70%), <inline-formula>
<mml:math display="inline" id="im2">
<mml:mrow>
<mml:mo>&#x223c;</mml:mo>
<mml:mn>20500</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> (10%) and <inline-formula>
<mml:math display="inline" id="im3">
<mml:mrow>
<mml:mo>&#x223c;</mml:mo>
<mml:mn>43000</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> (20%) of ESs are most strongly associated with the heterodimer, alpha and beta subunits, respectively. We note that not all 37 heterodimers exhibit single-chain specificity (see below). Thus, the vast majority of class II associated TCR <inline-formula>
<mml:math display="inline" id="im4">
<mml:mi>&#x3b2;</mml:mi>
</mml:math>
</inline-formula>s appear to be specific to the combined <inline-formula>
<mml:math display="inline" id="im5">
<mml:mrow>
<mml:mi>&#x3b1;</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>&#x3b2;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> chains. This finding is bolstered by the fact that the ES sets we derive discriminate HLA-DP and -DQ heterodimers and not individual subunits (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2</bold>
</xref>; see also <xref ref-type="supplementary-material" rid="SF6">
<bold>Supplementary Figures S6</bold>
</xref>-<xref ref-type="supplementary-material" rid="SF7">
<bold>7</bold>
</xref>, which show ES distributions for all heterodimers).</p>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>Some TCR<italic>&#x3b2;</italic>s appear to be specific to the class II HLA subunit rather than heterodimer. <bold>(A)</bold> DQA1*01:05+DQB1*05:01 ES counts observed in each sample as a function of sequencing depth. The ESs separate DQA1*01:05+DQB1*05:01 positive subjects from DQA1*01:05+DQB1*05:01 negative subjects. However, subjects who have the DQB subunit appear elevated above the control population of subjects with neither subunit. <bold>(B)</bold> ES count plotted against sequencing depth for the subset of ESs which associate most strongly with DQA1*01:05+DQB1*05:01 heterodimer via the L1LR method. A majority of TCR<italic>&#x3b2;</italic>s which make up the ES set for DQA1*01:05+DQB1*05:01 appear to be specific to the heterodimer. <bold>(C)</bold> ES count plotted against sequencing depth for the subset of ESs which associate most strongly to subunit DQB1*05:01 via the L1LR method. A small fraction of TCR<italic>&#x3b2;</italic>s which make up the ES set for DQA1*01:05+DQB1*05:01 appear to be specific only to the <italic>&#x3b2;</italic> chain subunit. <bold>(D)</bold> Same as <bold>(C)</bold> but color-coding subjects with DQB1*05:01 by their various <bold>
<italic>&#x3b1;</italic>
</bold> chain pairings. This subset of TCR<italic>&#x3b2;</italic>s appear to be specific to all possible heterodimeric combinations which include DQB1*05:01, thus suggesting specificity solely to the <italic>&#x3b2;</italic> chain subunit. Results are shown for train sample and are consistent with holdout sample.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fimmu-16-1603730-g002.tif">
<alt-text content-type="machine-generated">Scatter plots depicting enhanced sequence counts versus total unique rearrangements, separated into four panels labeled A, B, C, and D. Each panel contains colored dots representing different data categories, as indicated by their legends. Panels A and B show counts up to 800 and 600, respectively, while panels C and D show counts up to 200. Legends detail specific genetic markers associated with each color.</alt-text>
</graphic>
</fig>
<p>We find that only a subset of ESs and HLAs exhibit exceptions to heterodimeric specificity. For example, some TCR <inline-formula>
<mml:math display="inline" id="im6">
<mml:mi>&#x3b2;</mml:mi>
</mml:math>
</inline-formula>s appear to be associated to all heterodimers composed of the DQB1*05:01 subunit, indicating many of these TCR <inline-formula>
<mml:math display="inline" id="im7">
<mml:mi>&#x3b2;</mml:mi>
</mml:math>
</inline-formula>s are associated with the subunit itself (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2</bold>
</xref>). DQB1*05:01 is the clearest example of TCR specificity to a subunit. However, we observe such subunit specificity across multiple subunits: DPB1*01:01, DQB1*02:01 (DQB1*02:02)<xref ref-type="fn" rid="fn2">
<sup>2</sup>
</xref>, DQB1*03:01, DQB1*05:01, DQB1*06:03, DQA1*03:01 (DQA1*03:03) and DQA1*05:01 (DQA1*05:05). TCR specificity to subunits appears to be more common for the HLA <inline-formula>
<mml:math display="inline" id="im8">
<mml:mi>&#x3b2;</mml:mi>
</mml:math>
</inline-formula> chain and to the HLA-DQ locus, though we observe single-chain specificity in both the <inline-formula>
<mml:math display="inline" id="im9">
<mml:mi>&#x3b1;</mml:mi>
</mml:math>
</inline-formula> and <inline-formula>
<mml:math display="inline" id="im10">
<mml:mi>&#x3b2;</mml:mi>
</mml:math>
</inline-formula> chains of HLA-DQ and a <inline-formula>
<mml:math display="inline" id="im11">
<mml:mi>&#x3b2;</mml:mi>
</mml:math>
</inline-formula> chain of HLA-DP. We note that our identification is likely not exhaustive as many heterodimers lack enough diversity in one or both subunits to statistically associate TCRs independent of the heterodimer.</p>
<p>Based on a limited set of solved structures, a conserved binding pattern has been proposed for class II TCR-pHLA interactions such that TCR <inline-formula>
<mml:math display="inline" id="im12">
<mml:mi>&#x3b1;</mml:mi>
</mml:math>
</inline-formula> contacts the <inline-formula>
<mml:math display="inline" id="im13">
<mml:mi>&#x3b1;</mml:mi>
</mml:math>
</inline-formula> helix of the HLA <inline-formula>
<mml:math display="inline" id="im14">
<mml:mi>&#x3b2;</mml:mi>
</mml:math>
</inline-formula> chain and TCR <inline-formula>
<mml:math display="inline" id="im15">
<mml:mi>&#x3b2;</mml:mi>
</mml:math>
</inline-formula> contacts the <inline-formula>
<mml:math display="inline" id="im16">
<mml:mi>&#x3b1;</mml:mi>
</mml:math>
</inline-formula> helix of the HLA <inline-formula>
<mml:math display="inline" id="im17">
<mml:mi>&#x3b1;</mml:mi>
</mml:math>
</inline-formula> chain (<xref ref-type="bibr" rid="B55">55</xref>). Thus, the various specificity patterns we observe may reflect TCR interactions strongly mediated by peptides and not the direct interactions between TCRs and HLAs which may be conserved. Future analyses based on larger sets of solved or perhaps <italic>in silico</italic> generated structures of class II TCR-pHLA complexes will be informative for exploring the structural basis of the various specificity patterns we identify.</p>
</sec>
</sec>
<sec id="s2_3">
<title>TCR breadth is proportional to zygosity</title>
<p>HLA homozygosity has been epidemiologically linked to poor clinical prognosis in the context of both chronic HIV infection (<xref ref-type="bibr" rid="B56">56</xref>) and cancer checkpoint-inhibitor immunotherapy (<xref ref-type="bibr" rid="B57">57</xref>), possibly due to the reduced size of the HLA-restricted peptide repertoire available for T-cell recognition. This reduced size of the antigen repertoire, coupled with higher relative surface concentration of pHLAs associated with the homozygous protein, may directly impact the TCR repertoire by increasing the probability of clonal expansion of T cells expressing cognate TCRs. Consistent with this hypothesis, we find that the distribution of ES counts is elevated among homozygous individuals (<xref ref-type="fig" rid="f3">
<bold>Figures&#xa0;3A-F</bold>
</xref>). Across all HLAs, the distribution of ESs is(on average) about one standard deviation higher for homozygous as compared to heterozygous individuals (<xref ref-type="fig" rid="f3">
<bold>Figures&#xa0;3G, H</bold>
</xref>). Notably, the ES distribution is an additional standard deviation higher among individuals homozygous at both the <inline-formula>
<mml:math display="inline" id="im18">
<mml:mi>&#x3b1;</mml:mi>
</mml:math>
</inline-formula> and <inline-formula>
<mml:math display="inline" id="im19">
<mml:mi>&#x3b2;</mml:mi>
</mml:math>
</inline-formula> locus for HLA-DP or -DQ (&#x201c;double homozygous&#x201d;, <xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3H</bold>
</xref>).</p>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>Breadth of T cell response is proportional to HLA zygosity. <bold>(A)</bold> A*02:01, <bold>(B)</bold> B*07:02, <bold>(C)</bold> C*04:01, <bold>(D)</bold> DPA1*01:03+DPB1*02:01, <bold>(E)</bold> DQA1*01:02+DQB1*06:02 and <bold>(F)</bold> DRB1*07:01 ESs observed in each sample plotted against total number of unique rearrangements. HLA negative, heterozygous positive and homozygous positive subjects are shown in blue, orange and green, respectively. For HLA-DP and DQ, double homozygous subjects are shown in red. The breadth of the ES response appears to be correlated with homozygosity across all six loci. We quantify the the increased breadth resulting from homozygosity by fitting the mean and standard deviation of the ES counts in heterozygous cases for each HLA as a function of sequencing depth andthen calculating the z-score for all subjects and all well-represented HLAs. We aggregate z-score distributions per-loci for <bold>(G)</bold> class I and <bold>(H)</bold> class II HLAs. Results are shown for train sample and are consistent with holdout sample.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fimmu-16-1603730-g003.tif">
<alt-text content-type="machine-generated">Scatter plots (A-F) and box plots (G-H) show genetic variations and statistical distributions. Scatter plots display enhanced sequence counts vs. unique rearrangements, categorized by controls, heterozygous, homozygous, and double homozygous groups. Box plots illustrate Z scores for these groups, color-coded by different categories (A, B, C, DP, DQ, DR), showing data dispersion and outliers.</alt-text>
</graphic>
</fig>
<p>While these results are consistent with increased relative antigen abundance increasing clonal expansion of associated T cells, an alternative hypothesis is that a decrease in the relative surface expression or decreased antigenic diversity in homozygous subjects results in less crowding out by other HLAs or TCRs, respectivly. This crowding hypothesis implies an increased breadth across multiple loci within a given class for homozygous subjects. We test this hypothesis by examining whether a homozygous subject at one locus has higher breadth at another class-matched loci. For example, if HLA and/or TCRs crowd each other, we expect that a subject homozygous for HLA-A will also have a higher average breadth in their HLA-B and/or HLA-C response due to lower diversity at the class I loci. We do not find evidence of such an effect (see <xref ref-type="supplementary-material" rid="SF10">
<bold>Supplementary Figure S10</bold>
</xref>) and thus conclude that crowding out by HLAs and/or TCRs may not be the primary driver of increased breadth unless it is restricted to a particular locus.</p>
<p>Taken together, these results suggest homozygosity at a particular locus increases the breadth of the T-cell response against peptides presented by that HLA, possibly through increased surface expression and antigen presentation.</p>
</sec>
<sec id="s2_4">
<title>Imputing HLA genotype from TCR repertoires</title>
<p>The clear separation of ES counts in HLA cases versus controls implies that HLA allotypes can be easily imputed from HLA-associated TCR <inline-formula>
<mml:math display="inline" id="im20">
<mml:mi>&#x3b2;</mml:mi>
</mml:math>
</inline-formula>s alone. To this end, we fit a simple logistic regression model for each HLA allotype observed in at least 30 training samples (representing <inline-formula>
<mml:math display="inline" id="im21">
<mml:mrow>
<mml:mo>&#x223c;</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>%</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> expression frequency), predicting whether an individual expresses that HLA as a function of observed ES and total-unique-rearrangement (log) counts (see <xref ref-type="fig" rid="f4">
<bold>Figures&#xa0;4A, B</bold>
</xref> for representative examples, <xref ref-type="supplementary-material" rid="SF3">
<bold>Supplementary Figures S3</bold>
</xref>-<xref ref-type="supplementary-material" rid="SF8">
<bold>S8</bold>
</xref> for all HLAs tested). The number of subjects with each HLA allotype based on HLA genotyping and the model performance for each imputed allotype are provided in <xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref> (class I) and <xref ref-type="table" rid="T3">
<bold>Table&#xa0;3</bold>
</xref> (class II); model performance is also shown in <xref ref-type="fig" rid="f4">
<bold>Figure 4C</bold>
</xref>.</p>
<table-wrap id="T2" position="float">
<label>Table&#xa0;2</label>
<caption>
<p>Model performance of class I HLAs.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" rowspan="2" align="left">HLA</th>
<th valign="middle" align="left"/>
<th valign="middle" align="left">Train</th>
<th valign="middle" align="left">Train CV</th>
<th valign="middle" align="left">Holdout</th>
</tr>
<tr>
<th valign="middle" align="left">N Cases</th>
<th valign="middle" align="left">AUCROC</th>
<th valign="middle" align="left">AUCROC</th>
<th valign="middle" align="left">AUCROC</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="left">A*01:01</td>
<td valign="middle" align="left">763</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">1.00</td>
</tr>
<tr>
<td valign="middle" align="left">A*02:01</td>
<td valign="middle" align="left">1314</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
</tr>
<tr>
<td valign="middle" align="left">A*02:02</td>
<td valign="middle" align="left">74</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
</tr>
<tr>
<td valign="middle" align="left">A*02:05</td>
<td valign="middle" align="left">75</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
</tr>
<tr>
<td valign="middle" align="left">A*02:06</td>
<td valign="middle" align="left">37</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.97</td>
<td valign="middle" align="left">1.00</td>
</tr>
<tr>
<td valign="middle" align="left">A*03:01</td>
<td valign="middle" align="left">703</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
</tr>
<tr>
<td valign="middle" align="left">A*11:01</td>
<td valign="middle" align="left">354</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
</tr>
<tr>
<td valign="middle" align="left">A*23:01</td>
<td valign="middle" align="left">231</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
</tr>
<tr>
<td valign="middle" align="left">A*23:17</td>
<td valign="middle" align="left">31</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
</tr>
<tr>
<td valign="middle" align="left">A*24:02</td>
<td valign="middle" align="left">495</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">0.99</td>
</tr>
<tr>
<td valign="middle" align="left">A*25:01</td>
<td valign="middle" align="left">107</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
</tr>
<tr>
<td valign="middle" align="left">A*26:01</td>
<td valign="middle" align="left">144</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
</tr>
<tr>
<td valign="middle" align="left">A*29:02</td>
<td valign="middle" align="left">196</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
</tr>
<tr>
<td valign="middle" align="left">A*30:01</td>
<td valign="middle" align="left">174</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
</tr>
<tr>
<td valign="middle" align="left">A*30:02</td>
<td valign="middle" align="left">133</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
</tr>
<tr>
<td valign="middle" align="left">A*31:01</td>
<td valign="middle" align="left">177</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
</tr>
<tr>
<td valign="middle" align="left">A*32:01</td>
<td valign="middle" align="left">179</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
</tr>
<tr>
<td valign="middle" align="left">A*33:01</td>
<td valign="middle" align="left">74</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
</tr>
<tr>
<td valign="middle" align="left">A*33:03</td>
<td valign="middle" align="left">142</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
</tr>
<tr>
<td valign="middle" align="left">A*34:02</td>
<td valign="middle" align="left">60</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
</tr>
<tr>
<td valign="middle" align="left">A*36:01</td>
<td valign="middle" align="left">58</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
</tr>
<tr>
<td valign="middle" align="left">A*66:01</td>
<td valign="middle" align="left">40</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">0.98</td>
<td valign="middle" align="left">1.00</td>
</tr>
<tr>
<td valign="middle" align="left">A*68:01</td>
<td valign="middle" align="left">204</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
</tr>
<tr>
<td valign="middle" align="left">A*68:02</td>
<td valign="middle" align="left">160</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
</tr>
<tr>
<td valign="middle" align="left">A*74:01</td>
<td valign="middle" align="left">111</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">1.00</td>
</tr>
<tr>
<td valign="middle" align="left">B*07:02</td>
<td valign="middle" align="left">660</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
</tr>
<tr>
<td valign="middle" align="left">B*08:01</td>
<td valign="middle" align="left">559</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">1.00</td>
</tr>
<tr>
<td valign="middle" align="left">B*13:02</td>
<td valign="middle" align="left">125</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
</tr>
<tr>
<td valign="middle" align="left">B*14:01</td>
<td valign="middle" align="left">56</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">1.00</td>
</tr>
<tr>
<td valign="middle" align="left">B*14:02</td>
<td valign="middle" align="left">175</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
</tr>
<tr>
<td valign="middle" align="left">B*15:01</td>
<td valign="middle" align="left">291</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">1.00</td>
</tr>
<tr>
<td valign="middle" align="left">B*15:03</td>
<td valign="middle" align="left">104</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
</tr>
<tr>
<td valign="middle" align="left">B*15:10</td>
<td valign="middle" align="left">72</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
</tr>
<tr>
<td valign="middle" align="left">B*15:16</td>
<td valign="middle" align="left">36</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
</tr>
<tr>
<td valign="middle" align="left">B*18:01</td>
<td valign="middle" align="left">261</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
</tr>
<tr>
<td valign="middle" align="left">B*27:05</td>
<td valign="middle" align="left">169</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
</tr>
<tr>
<td valign="middle" align="left">B*35:01</td>
<td valign="middle" align="left">390</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
</tr>
<tr>
<td valign="middle" align="left">B*35:02</td>
<td valign="middle" align="left">53</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.98</td>
<td valign="middle" align="left">0.96</td>
</tr>
<tr>
<td valign="middle" align="left">B*35:03</td>
<td valign="middle" align="left">91</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
</tr>
<tr>
<td valign="middle" align="left">B*37:01</td>
<td valign="middle" align="left">65</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
</tr>
<tr>
<td valign="middle" align="left">B*38:01</td>
<td valign="middle" align="left">85</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">0.99</td>
</tr>
<tr>
<td valign="middle" align="left">B*39:01</td>
<td valign="middle" align="left">71</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
</tr>
<tr>
<td valign="middle" align="left">B*40:01</td>
<td valign="middle" align="left">290</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
</tr>
<tr>
<td valign="middle" align="left">B*40:02</td>
<td valign="middle" align="left">80</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
</tr>
<tr>
<td valign="middle" align="left">B*42:01</td>
<td valign="middle" align="left">94</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
</tr>
<tr>
<td valign="middle" align="left">B*44:02</td>
<td valign="middle" align="left">405</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
</tr>
<tr>
<td valign="middle" align="left">B*44:03</td>
<td valign="middle" align="left">333</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
</tr>
<tr>
<td valign="middle" align="left">B*45:01</td>
<td valign="middle" align="left">114</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
</tr>
<tr>
<td valign="middle" align="left">B*49:01</td>
<td valign="middle" align="left">123</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
</tr>
<tr>
<td valign="middle" align="left">B*50:01</td>
<td valign="middle" align="left">78</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">1.00</td>
</tr>
<tr>
<td valign="middle" align="left">B*51:01</td>
<td valign="middle" align="left">269</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
</tr>
<tr>
<td valign="middle" align="left">B*52:01</td>
<td valign="middle" align="left">74</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
</tr>
<tr>
<td valign="middle" align="left">B*53:01</td>
<td valign="middle" align="left">199</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
</tr>
<tr>
<td valign="middle" align="left">B*55:01</td>
<td valign="middle" align="left">95</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
</tr>
<tr>
<td valign="middle" align="left">B*56:01</td>
<td valign="middle" align="left">32</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">0.96</td>
<td valign="middle" align="left">0.83</td>
</tr>
<tr>
<td valign="middle" align="left">B*57:01</td>
<td valign="middle" align="left">166</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">0.99</td>
</tr>
<tr>
<td valign="middle" align="left">B*57:03</td>
<td valign="middle" align="left">54</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">1.00</td>
</tr>
<tr>
<td valign="middle" align="left">B*58:01</td>
<td valign="middle" align="left">109</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
</tr>
<tr>
<td valign="middle" align="left">B*58:02</td>
<td valign="middle" align="left">80</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">0.99</td>
</tr>
<tr>
<td valign="middle" align="left">C*01:02</td>
<td valign="middle" align="left">208</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">0.95</td>
<td valign="middle" align="left">0.96</td>
</tr>
<tr>
<td valign="middle" align="left">C*02:02</td>
<td valign="middle" align="left">209</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">0.97</td>
<td valign="middle" align="left">0.94</td>
</tr>
<tr>
<td valign="middle" align="left">C*02:10</td>
<td valign="middle" align="left">119</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.98</td>
<td valign="middle" align="left">0.97</td>
</tr>
<tr>
<td valign="middle" align="left">C*03:02</td>
<td valign="middle" align="left">59</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.95</td>
<td valign="middle" align="left">1.00</td>
</tr>
<tr>
<td valign="middle" align="left">C*03:03</td>
<td valign="middle" align="left">282</td>
<td valign="middle" align="left">0.96</td>
<td valign="middle" align="left">0.89</td>
<td valign="middle" align="left">0.89</td>
</tr>
<tr>
<td valign="middle" align="left">C*03:04</td>
<td valign="middle" align="left">480</td>
<td valign="middle" align="left">0.98</td>
<td valign="middle" align="left">0.95</td>
<td valign="middle" align="left">0.96</td>
</tr>
<tr>
<td valign="middle" align="left">C*04:01</td>
<td valign="middle" align="left">829</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">0.98</td>
</tr>
<tr>
<td valign="middle" align="left">C*05:01</td>
<td valign="middle" align="left">446</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">0.96</td>
<td valign="middle" align="left">0.95</td>
</tr>
<tr>
<td valign="middle" align="left">C*06:02</td>
<td valign="middle" align="left">559</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
</tr>
<tr>
<td valign="middle" align="left">C*07:01</td>
<td valign="middle" align="left">763</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.98</td>
<td valign="middle" align="left">0.99</td>
</tr>
<tr>
<td valign="middle" align="left">C*07:02</td>
<td valign="middle" align="left">757</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.96</td>
<td valign="middle" align="left">0.97</td>
</tr>
<tr>
<td valign="middle" align="left">C*07:04</td>
<td valign="middle" align="left">73</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.66</td>
<td valign="middle" align="left">0.68</td>
</tr>
<tr>
<td valign="middle" align="left">C*07:18</td>
<td valign="middle" align="left">81</td>
<td valign="middle" align="left">0.98</td>
<td valign="middle" align="left">0.96</td>
<td valign="middle" align="left">0.93</td>
</tr>
<tr>
<td valign="middle" align="left">C*08:01</td>
<td valign="middle" align="left">30</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.95</td>
<td valign="middle" align="left">0.87</td>
</tr>
<tr>
<td valign="middle" align="left">C*08:02</td>
<td valign="middle" align="left">246</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">0.99</td>
</tr>
<tr>
<td valign="middle" align="left">C*12:02</td>
<td valign="middle" align="left">55</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.92</td>
<td valign="middle" align="left">0.94</td>
</tr>
<tr>
<td valign="middle" align="left">C*12:03</td>
<td valign="middle" align="left">246</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.98</td>
</tr>
<tr>
<td valign="middle" align="left">C*14:02</td>
<td valign="middle" align="left">75</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.98</td>
<td valign="middle" align="left">0.99</td>
</tr>
<tr>
<td valign="middle" align="left">C*15:02</td>
<td valign="middle" align="left">114</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">0.84</td>
<td valign="middle" align="left">0.93</td>
</tr>
<tr>
<td valign="middle" align="left">C*15:05</td>
<td valign="middle" align="left">43</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">0.93</td>
<td valign="middle" align="left">0.98</td>
</tr>
<tr>
<td valign="middle" align="left">C*16:01</td>
<td valign="middle" align="left">320</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">0.98</td>
</tr>
<tr>
<td valign="middle" align="left">C*17:01</td>
<td valign="middle" align="left">132</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.94</td>
<td valign="middle" align="left">0.94</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>The HLA allele and number of subjects with the given HLA are listed in columns 1 and 2, respectively. Columns 3&#x2013;5 indicate model performance when the trained model is evaluated on the train, train CV and holdout data sets, respectively.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<table-wrap id="T3" position="float">
<label>Table&#xa0;3</label>
<caption>
<p>Model performance of class II HLAs.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" rowspan="2" align="left">HLA</th>
<th valign="middle" align="left"/>
<th valign="middle" align="left">Train</th>
<th valign="middle" align="left">Train CV</th>
<th valign="middle" align="left">Holdout</th>
<th valign="middle" align="left"/>
</tr>
<tr>
<th valign="middle" align="left">N Cases</th>
<th valign="middle" align="left">AUCROC</th>
<th valign="middle" align="left">AUCROC</th>
<th valign="middle" align="left">AUCROC</th>
<th valign="middle" align="left">In LD</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="left">DPA1*01:03+DPB1*01:01</td>
<td valign="middle" align="left">387</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DPA1*01:03+DPB1*02:01</td>
<td valign="middle" align="left">796</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DPA1*01:03+DPB1*02:02</td>
<td valign="middle" align="left">39</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.97</td>
<td valign="middle" align="left">0.97</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DPA1*01:03+DPB1*03:01</td>
<td valign="middle" align="left">415</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DPA1*01:03+DPB1*04:01</td>
<td valign="middle" align="left">1618</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DPA1*01:03+DPB1*04:02</td>
<td valign="middle" align="left">571</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DPA1*01:03+DPB1*05:01</td>
<td valign="middle" align="left">117</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DPA1*01:03+DPB1*06:01</td>
<td valign="middle" align="left">85</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DPA1*01:03+DPB1*104:01</td>
<td valign="middle" align="left">101</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DPA1*01:03+DPB1*105:01</td>
<td valign="middle" align="left">66</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">0.93</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DPA1*01:03+DPB1*10:01</td>
<td valign="middle" align="left">70</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.98</td>
<td valign="middle" align="left">0.95</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DPA1*01:03+DPB1*11:01</td>
<td valign="middle" align="left">92</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.96</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DPA1*01:03+DPB1*13:01</td>
<td valign="middle" align="left">85</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DPA1*01:03+DPB1*14:01</td>
<td valign="middle" align="left">55</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DPA1*01:03+DPB1*17:01</td>
<td valign="middle" align="left">78</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.97</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DPA1*01:03+DPB1*18:01</td>
<td valign="middle" align="left">113</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DPA1*02:01+DPB1*01:01</td>
<td valign="middle" align="left">461</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DPA1*02:01+DPB1*02:01</td>
<td valign="middle" align="left">172</td>
<td valign="middle" align="left">0.92</td>
<td valign="middle" align="left">0.57</td>
<td valign="middle" align="left">0.58</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DPA1*02:01+DPB1*03:01</td>
<td valign="middle" align="left">71</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">0.95</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DPA1*02:01+DPB1*04:01</td>
<td valign="middle" align="left">324</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.57</td>
<td valign="middle" align="left">0.61</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DPA1*02:01+DPB1*04:02</td>
<td valign="middle" align="left">96</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.54</td>
<td valign="middle" align="left">0.57</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DPA1*02:01+DPB1*05:01</td>
<td valign="middle" align="left">36</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.94</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DPA1*02:01+DPB1*09:01</td>
<td valign="middle" align="left">39</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">0.94</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DPA1*02:01+DPB1*105:01</td>
<td valign="middle" align="left">52</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.80</td>
<td valign="middle" align="left">0.79</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DPA1*02:01+DPB1*10:01</td>
<td valign="middle" align="left">84</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">0.98</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DPA1*02:01+DPB1*11:01</td>
<td valign="middle" align="left">145</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DPA1*02:01+DPB1*131:01</td>
<td valign="middle" align="left">39</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DPA1*02:01+DPB1*13:01</td>
<td valign="middle" align="left">139</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DPA1*02:01+DPB1*14:01</td>
<td valign="middle" align="left">71</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DPA1*02:01+DPB1*17:01</td>
<td valign="middle" align="left">143</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DPA1*02:01+DPB1*18:01</td>
<td valign="middle" align="left">35</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.70</td>
<td valign="middle" align="left">0.73</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DPA1*02:02+DPB1*01:01</td>
<td valign="middle" align="left">268</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DPA1*02:02+DPB1*02:01</td>
<td valign="middle" align="left">63</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.61</td>
<td valign="middle" align="left">0.56</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DPA1*02:02+DPB1*04:01</td>
<td valign="middle" align="left">78</td>
<td valign="middle" align="left">0.97</td>
<td valign="middle" align="left">0.80</td>
<td valign="middle" align="left">0.84</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DPA1*02:02+DPB1*05:01</td>
<td valign="middle" align="left">102</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.95</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DPA1*02:06+DPB1*05:01</td>
<td valign="middle" align="left">34</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.96</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DPA1*03:01+DPB1*01:01</td>
<td valign="middle" align="left">54</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.78</td>
<td valign="middle" align="left">0.91</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DPA1*03:01+DPB1*105:01</td>
<td valign="middle" align="left">140</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*01:01+DQB1*02:01</td>
<td valign="middle" align="left">65</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.80</td>
<td valign="middle" align="left">0.83</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*01:01+DQB1*02:02</td>
<td valign="middle" align="left">78</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.81</td>
<td valign="middle" align="left">0.72</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*01:01+DQB1*03:01</td>
<td valign="middle" align="left">122</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.78</td>
<td valign="middle" align="left">0.75</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*01:01+DQB1*03:02</td>
<td valign="middle" align="left">53</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.76</td>
<td valign="middle" align="left">0.68</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*01:01+DQB1*05:01</td>
<td valign="middle" align="left">602</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*01:01+DQB1*06:02</td>
<td valign="middle" align="left">81</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.91</td>
<td valign="middle" align="left">0.98</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*01:01+DQB1*06:03</td>
<td valign="middle" align="left">32</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.94</td>
<td valign="middle" align="left">0.98</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*01:02+DQB1*02:01</td>
<td valign="middle" align="left">161</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.81</td>
<td valign="middle" align="left">0.85</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*01:02+DQB1*02:02</td>
<td valign="middle" align="left">181</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.80</td>
<td valign="middle" align="left">0.77</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*01:02+DQB1*03:01</td>
<td valign="middle" align="left">214</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.72</td>
<td valign="middle" align="left">0.73</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*01:02+DQB1*03:02</td>
<td valign="middle" align="left">102</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.69</td>
<td valign="middle" align="left">0.76</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*01:02+DQB1*03:03</td>
<td valign="middle" align="left">41</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">0.54</td>
<td valign="middle" align="left">0.55</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*01:02+DQB1*03:19</td>
<td valign="middle" align="left">59</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.86</td>
<td valign="middle" align="left">0.91</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*01:02+DQB1*04:02</td>
<td valign="middle" align="left">63</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.81</td>
<td valign="middle" align="left">0.65</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*01:02+DQB1*05:01</td>
<td valign="middle" align="left">221</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*01:02+DQB1*05:02</td>
<td valign="middle" align="left">149</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*01:02+DQB1*05:03</td>
<td valign="middle" align="left">33</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.85</td>
<td valign="middle" align="left">0.90</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*01:02+DQB1*06:02</td>
<td valign="middle" align="left">830</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*01:02+DQB1*06:03</td>
<td valign="middle" align="left">70</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.97</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*01:02+DQB1*06:04</td>
<td valign="middle" align="left">184</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*01:02+DQB1*06:09</td>
<td valign="middle" align="left">135</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*01:03+DQB1*02:01</td>
<td valign="middle" align="left">46</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.62</td>
<td valign="middle" align="left">0.76</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*01:03+DQB1*02:02</td>
<td valign="middle" align="left">43</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.64</td>
<td valign="middle" align="left">0.59</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*01:03+DQB1*03:01</td>
<td valign="middle" align="left">62</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.68</td>
<td valign="middle" align="left">0.69</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*01:03+DQB1*03:02</td>
<td valign="middle" align="left">33</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.62</td>
<td valign="middle" align="left">0.56</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*01:03+DQB1*05:01</td>
<td valign="middle" align="left">55</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">0.92</td>
<td valign="middle" align="left">0.91</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*01:03+DQB1*06:01</td>
<td valign="middle" align="left">54</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*01:03+DQB1*06:02</td>
<td valign="middle" align="left">53</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.95</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*01:03+DQB1*06:03</td>
<td valign="middle" align="left">299</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*01:04+DQB1*05:03</td>
<td valign="middle" align="left">122</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*01:05+DQB1*05:01</td>
<td valign="middle" align="left">145</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*01:05+DQB1*06:02</td>
<td valign="middle" align="left">30</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.81</td>
<td valign="middle" align="left">0.74</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*02:01+DQB1*02:01</td>
<td valign="middle" align="left">74</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*02:01+DQB1*02:02</td>
<td valign="middle" align="left">602</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*02:01+DQB1*03:01</td>
<td valign="middle" align="left">131</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">0.98</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*02:01+DQB1*03:02</td>
<td valign="middle" align="left">64</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.97</td>
<td valign="middle" align="left">0.97</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*02:01+DQB1*03:03</td>
<td valign="middle" align="left">164</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">0.98</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*02:01+DQB1*04:02</td>
<td valign="middle" align="left">32</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.87</td>
<td valign="middle" align="left">0.98</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*02:01+DQB1*05:01</td>
<td valign="middle" align="left">109</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.77</td>
<td valign="middle" align="left">0.66</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*02:01+DQB1*06:02</td>
<td valign="middle" align="left">110</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.96</td>
<td valign="middle" align="left">0.97</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*02:01+DQB1*06:03</td>
<td valign="middle" align="left">39</td>
<td valign="middle" align="left">0.90</td>
<td valign="middle" align="left">0.75</td>
<td valign="middle" align="left">0.79</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*02:01+DQB1*06:04</td>
<td valign="middle" align="left">30</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.78</td>
<td valign="middle" align="left">0.93</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*03:01+DQB1*02:01</td>
<td valign="middle" align="left">59</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.73</td>
<td valign="middle" align="left">0.77</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*03:01+DQB1*02:02</td>
<td valign="middle" align="left">49</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.97</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*03:01+DQB1*03:01</td>
<td valign="middle" align="left">78</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*03:01+DQB1*03:02</td>
<td valign="middle" align="left">442</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*03:01+DQB1*05:01</td>
<td valign="middle" align="left">55</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.64</td>
<td valign="middle" align="left">0.68</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*03:01+DQB1*06:02</td>
<td valign="middle" align="left">55</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.81</td>
<td valign="middle" align="left">0.68</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*03:02+DQB1*03:03</td>
<td valign="middle" align="left">76</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*03:03+DQB1*02:01</td>
<td valign="middle" align="left">52</td>
<td valign="middle" align="left">0.98</td>
<td valign="middle" align="left">0.90</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*03:03+DQB1*02:02</td>
<td valign="middle" align="left">120</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*03:03+DQB1*03:01</td>
<td valign="middle" align="left">306</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*03:03+DQB1*03:02</td>
<td valign="middle" align="left">98</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*03:03+DQB1*03:03</td>
<td valign="middle" align="left">40</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.92</td>
<td valign="middle" align="left">0.82</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*03:03+DQB1*04:02</td>
<td valign="middle" align="left">30</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.73</td>
<td valign="middle" align="left">0.71</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*03:03+DQB1*05:01</td>
<td valign="middle" align="left">72</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.73</td>
<td valign="middle" align="left">0.81</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*03:03+DQB1*06:02</td>
<td valign="middle" align="left">65</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.77</td>
<td valign="middle" align="left">0.92</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*04:01+DQB1*02:02</td>
<td valign="middle" align="left">38</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.72</td>
<td valign="middle" align="left">0.79</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*04:01+DQB1*03:01</td>
<td valign="middle" align="left">33</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.90</td>
<td valign="middle" align="left">0.81</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*04:01+DQB1*03:19</td>
<td valign="middle" align="left">64</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*04:01+DQB1*04:02</td>
<td valign="middle" align="left">241</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*04:01+DQB1*05:01</td>
<td valign="middle" align="left">38</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.66</td>
<td valign="middle" align="left">0.57</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*04:01+DQB1*06:02</td>
<td valign="middle" align="left">49</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.91</td>
<td valign="middle" align="left">0.95</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*05:01+DQB1*02:01</td>
<td valign="middle" align="left">639</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*05:01+DQB1*02:02</td>
<td valign="middle" align="left">57</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*05:01+DQB1*03:01</td>
<td valign="middle" align="left">122</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*05:01+DQB1*03:02</td>
<td valign="middle" align="left">63</td>
<td valign="middle" align="left">0.97</td>
<td valign="middle" align="left">0.97</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*05:01+DQB1*03:03</td>
<td valign="middle" align="left">30</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.93</td>
<td valign="middle" align="left">0.95</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*05:01+DQB1*04:02</td>
<td valign="middle" align="left">31</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.69</td>
<td valign="middle" align="left">0.90</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*05:01+DQB1*05:01</td>
<td valign="middle" align="left">80</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.73</td>
<td valign="middle" align="left">0.72</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*05:01+DQB1*06:02</td>
<td valign="middle" align="left">95</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.83</td>
<td valign="middle" align="left">0.88</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*05:01+DQB1*06:03</td>
<td valign="middle" align="left">37</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.70</td>
<td valign="middle" align="left">0.80</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*05:05+DQB1*02:01</td>
<td valign="middle" align="left">84</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*05:05+DQB1*02:02</td>
<td valign="middle" align="left">69</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.97</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*05:05+DQB1*03:01</td>
<td valign="middle" align="left">601</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*05:05+DQB1*03:02</td>
<td valign="middle" align="left">66</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">0.94</td>
<td valign="middle" align="left">0.94</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*05:05+DQB1*03:19</td>
<td valign="middle" align="left">116</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*05:05+DQB1*05:01</td>
<td valign="middle" align="left">101</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.76</td>
<td valign="middle" align="left">0.67</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*05:05+DQB1*06:02</td>
<td valign="middle" align="left">117</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.84</td>
<td valign="middle" align="left">0.82</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*05:05+DQB1*06:03</td>
<td valign="middle" align="left">41</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.73</td>
<td valign="middle" align="left">0.77</td>
<td valign="middle" align="left">No</td>
</tr>
<tr>
<td valign="middle" align="left">DQA1*06:01+DQB1*03:01</td>
<td valign="middle" align="left">40</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DRB1*01:01</td>
<td valign="middle" align="left">442</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DRB1*01:02</td>
<td valign="middle" align="left">138</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DRB1*01:03</td>
<td valign="middle" align="left">49</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DRB1*03:01</td>
<td valign="middle" align="left">655</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DRB1*03:02</td>
<td valign="middle" align="left">103</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DRB1*04:01</td>
<td valign="middle" align="left">421</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DRB1*04:02</td>
<td valign="middle" align="left">46</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DRB1*04:03</td>
<td valign="middle" align="left">49</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DRB1*04:04</td>
<td valign="middle" align="left">190</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DRB1*04:05</td>
<td valign="middle" align="left">76</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DRB1*04:07</td>
<td valign="middle" align="left">72</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DRB1*07:01</td>
<td valign="middle" align="left">750</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DRB1*08:01</td>
<td valign="middle" align="left">109</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DRB1*08:02</td>
<td valign="middle" align="left">34</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DRB1*08:04</td>
<td valign="middle" align="left">93</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DRB1*09:01</td>
<td valign="middle" align="left">126</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DRB1*10:01</td>
<td valign="middle" align="left">79</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DRB1*11:01</td>
<td valign="middle" align="left">388</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DRB1*11:02</td>
<td valign="middle" align="left">85</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DRB1*11:04</td>
<td valign="middle" align="left">141</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DRB1*12:01</td>
<td valign="middle" align="left">154</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DRB1*13:01</td>
<td valign="middle" align="left">364</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DRB1*13:02</td>
<td valign="middle" align="left">353</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DRB1*13:03</td>
<td valign="middle" align="left">95</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DRB1*14:54</td>
<td valign="middle" align="left">129</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DRB1*15:01</td>
<td valign="middle" align="left">611</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DRB1*15:02</td>
<td valign="middle" align="left">75</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DRB1*15:03</td>
<td valign="middle" align="left">202</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DRB1*16:01</td>
<td valign="middle" align="left">64</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DRB1*16:02</td>
<td valign="middle" align="left">54</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DRB3*01:01</td>
<td valign="middle" align="left">654</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DRB3*01:62</td>
<td valign="middle" align="left">91</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DRB3*02:02</td>
<td valign="middle" align="left">1005</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DRB3*03:01</td>
<td valign="middle" align="left">374</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DRB4*01:01</td>
<td valign="middle" align="left">361</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DRB4*01:03</td>
<td valign="middle" align="left">1014</td>
<td valign="middle" align="left">0.99</td>
<td valign="middle" align="left">0.98</td>
<td valign="middle" align="left">0.98</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DRB5*01:01</td>
<td valign="middle" align="left">677</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DRB5*01:02</td>
<td valign="middle" align="left">41</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
<tr>
<td valign="middle" align="left">DRB5*02:02</td>
<td valign="middle" align="left">75</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">1.00</td>
<td valign="middle" align="left">Yes</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>The HLA allele and number of subjects with the given HLA are listed in columns 1 and 2, respectively. Columns 3&#x2013;5 indicate model performance when the trained model is evaluated on the train, train CV and holdout data sets, respectively. Column 6 indicates whether the heterodimer is observed to be in linkage disequilibrium. HLAs in linkage equilibrium likely result from trans-complementation of the subunits (see main text).</p>
</fn>
</table-wrap-foot>
</table-wrap>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>Robust predictions of hundreds of HLAs solely based on public T cells observed in the repertoire. ES counts for A*02:01 cases and controls plotted against total number of unique rearrangements for <bold>(A)</bold> train and <bold>(B)</bold> holdout samples. The green line indicates the call threshold. <bold>(C)</bold> AUC-ROC of HLA models across each loci sorted by performance. The hashed bars for HLA-DP and -DQ indicate heterodimer resulting from subunits combinations in linkage equilibrium suggesting trans-complementation. We show below that many of these HLAs are likely non-functional. Performance of <bold>(D)</bold> class I and <bold>(E)</bold> class II HLA models as a function of the number of training samples color-coded by loci. Performance correlates with the number of training samples, as expected. HLAs shown by hashed bars in <bold>(C)</bold> are excluded in <bold>(E)</bold>. In <bold>(C-E)</bold> we show performance derived from 5-fold cross validation (CV) of the train sample. CV performance is consistent with holdout performance.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fimmu-16-1603730-g004.tif">
<alt-text content-type="machine-generated">Five-panel figure with graphs showcasing sequence data analysis:  1. Panel (A): Scatter plot showing train controls (blue) and train cases (orange) with log-transformed enhanced sequence counts versus total unique rearrangements; a positive correlation line is present. 2. Panel (B): Similar scatter plot for holdout controls and cases, depicting a similar trend. 3. Panel (C): Bar graph of model performance across loci with varying AUC-ROC values, color-coded by loci types. 4. Panel (D): Scatter plot displaying AUC-ROC against the number of cases in training for HLA-A, B, and C loci. 5. Panel (E): Scatter plot for HLA-DP, DQ, and DR loci with similar metrics as panel D.</alt-text>
</graphic>
</fig>
<p>Over all the imputation accuracy is extremely high with area under the receiver operating characteristic curve (AUC-ROC) scores of <inline-formula>
<mml:math display="inline" id="im22">
<mml:mrow>
<mml:mo>&#x2265;</mml:mo>
<mml:mn>0.9</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> for all but 3 of the 120 HLA-A,-B, and -DR allotypes modeled. This accuracy highlights the specificity of HLA ESs,indicating HLAs at these loci can be accurately imputed from immunosequencing alone. Furthermore, this accuracy confirms that HLA <inline-formula>
<mml:math display="inline" id="im23">
<mml:mi>&#x3b2;</mml:mi>
</mml:math>
</inline-formula> alone is typically sufficient to identify shared antigen specificity of public T cells. Among class I HLAs, HLA-C allotypes are a notable outlier with relatively lower classification performance even among models with a significant number of positive training examples (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4D</bold>
</xref>). We hypothesize that this reduced performance is due in part to the <inline-formula>
<mml:math display="inline" id="im24">
<mml:mrow>
<mml:mo>&#x223c;</mml:mo>
<mml:mn>10</mml:mn>
<mml:mo>&#xd7;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>-lower surface expression of HLA-C compared to allotypes expressed by other class I genes (<xref ref-type="bibr" rid="B58">58</xref>).</p>
<p>Model performance among HLA-DP and -DQ heterodimers is substantially more variable than performance at the other loci. We find that 8 of the 30 HLA-DP and 37 of 81 of HLA-DQ fail to achieve AUC-ROC scores of &gt; <inline-formula>
<mml:math display="inline" id="im25">
<mml:mrow>
<mml:mn>0.9</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> even among heterodimers expressed in a high number of individuals in our training population (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4E</bold>
</xref>). Notably, HLA-DQ and -DP are the only loci we study with polymorphic <inline-formula>
<mml:math display="inline" id="im26">
<mml:mi>&#x3b1;</mml:mi>
</mml:math>
</inline-formula> chains, suggesting that heterodimer incompatibility may explain the lack of associated TCRs and the corresponding inability to impute expression of these heterodimers. We explore this issue in the next section.</p>
<p>We assess the generalizability of our imputation models and rule out overfitting or data leakage by evaluating model performance on an entirely independent, out-of-distribution cohort of 136 individuals from Kanazawa, Japan. Subjects in this&#xa0;cohort have HLAs genotyped by direct sequencing and none&#xa0;are included in our training or internal holdout sets. This&#xa0;population differs both genetically and geographically from&#xa0;the predominantly U.S.-based training cohort, thus providing a stringent test of the model&#x2019;s generalizability to out-of-distribution data. For this analysis, we use a set of 135 HLAs across all six loci that yield models with cross-validation precision <inline-formula>
<mml:math display="inline" id="im27">
<mml:mrow>
<mml:mo>&gt;</mml:mo>
<mml:mn>0.9</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>, recall <inline-formula>
<mml:math display="inline" id="im28">
<mml:mrow>
<mml:mo>&gt;</mml:mo>
<mml:mn>0.8</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula>
<mml:math display="inline" id="im29">
<mml:mrow>
<mml:mo>&#x2265;</mml:mo>
<mml:mn>30</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> positive training cases.</p>
<p>We apply the 135 HLA models to the Japanese cohort, resulting in an average of 8.5 imputations per individual, compared to 11.0 per individual in our internal validation cohort. This difference is expected and reflects the shift in HLA allele frequencies between the Japanese and U.S-based cohorts. Despite these differences, we observe comparable model performance for the subset of overlapping HLAs. The overall F1 score<xref ref-type="fn" rid="fn3">
<sup>3</sup>
</xref> for the Japanese cohort, aggregated across all imputations, is statistically consistent (<inline-formula>
<mml:math display="inline" id="im30">
<mml:mrow>
<mml:mo>&lt;</mml:mo>
<mml:mn>3</mml:mn>
<mml:mi>&#x3c3;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>) to that observed in the internal validation cohort (<inline-formula>
<mml:math display="inline" id="im31">
<mml:mrow>
<mml:mn>0.925</mml:mn>
<mml:mo>&#xb1;</mml:mo>
<mml:mn>0.006</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula>
<mml:math display="inline" id="im32">
<mml:mrow>
<mml:mn>0.940</mml:mn>
<mml:mo>&#xb1;</mml:mo>
<mml:mn>0.002</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>, respectively). These results confirm that model performance generalizes across genetic and geographic backgrounds and that the high accuracy we observe is not a consequence of data leakage, but rather reflects a strong HLA-specific signal in TCR repertoires.</p>
</sec>
<sec id="s2_5">
<title>Poor-performing class II models are trans-complemented, non-functional HLAs</title>
<p>HLAs are inherited as a haplotype, such that one full set is inherited on a single chromosome from each parent (<xref ref-type="bibr" rid="B59">59</xref>). The <inline-formula>
<mml:math display="inline" id="im33">
<mml:mi>&#x3b1;</mml:mi>
</mml:math>
</inline-formula> and <inline-formula>
<mml:math display="inline" id="im34">
<mml:mi>&#x3b2;</mml:mi>
</mml:math>
</inline-formula> chains of HLA-DP and -DQ<xref ref-type="fn" rid="fn4">
<sup>4</sup>
</xref> pair after synthesis, yielding a phenotype of up to four unique heterodimers in each individual: two formed in <italic>cis</italic>, where both subunits are encoded on the same chromosome, and two in <italic>trans</italic>, where the subunits are encoded on opposite chromosomes. Given the high degree of polymorphism observed in HLA-DP and -DQ subunits, it is perhaps unsurprising that some pairs of <italic>&#x3b1;</italic> and <italic>ta</italic> chains do not form stable heterodimers (<xref ref-type="bibr" rid="B60">60</xref>&#x2013;<xref ref-type="bibr" rid="B62">62</xref>). Based on structural and sequence analysis of HLA-DQ, Tollefsen et&#xa0;al. (<xref ref-type="bibr" rid="B62">62</xref>) propose specific group pairings that likely form stable heterodimers (though they note a small number of exceptions to the pairing rules).</p>
<p>In the context of the present study, the proposed existence of incompatible (and thus non-functional) <italic>&#x3b1;</italic> and <italic>&#x3b2;</italic> chains implies two testable hypotheses: (1) that co-inheritance of incompatible pairs on the same chromosome will be under strong negative selection (<xref ref-type="bibr" rid="B62">62</xref>); and (2) that incompatible pairs are unable to elicit a T-cell response and thus will not be associated with any public TCR<italic>&#x3b2;</italic>s.</p>
<p>The first hypothesis implies that co-expression of incompatible pairs almost always results from <italic>trans</italic>-complementation; as such, incompatible pairs will be in linkage equilibrium since they are not co-inherited. Conversely, <italic>cis</italic>-complementation should necessarily result in functional pairs thus all pairs forming from subunits in linkage disequilibrium should be functional. For two subunits <italic>&#x3b1;</italic> and <italic>&#x3b2;</italic>, with respective expression frequencies <inline-formula>
<mml:math display="inline" id="im35">
<mml:mrow>
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mi>&#x3b1;</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula>
<mml:math display="inline" id="im36">
<mml:mrow>
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mi>&#x3b2;</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> and co-expression frequency <inline-formula>
<mml:math display="inline" id="im37">
<mml:mrow>
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mrow>
<mml:mi>&#x3b1;</mml:mi>
<mml:mo>+</mml:mo>
<mml:mi>&#x3b2;</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, linkage equilibrium results in an expected co-expression frequency of approximately <inline-formula>
<mml:math display="inline" id="im38">
<mml:mrow>
<mml:msub>
<mml:mi>E</mml:mi>
<mml:mrow>
<mml:mi>L</mml:mi>
<mml:mi>E</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">[</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mrow>
<mml:mi>&#x3b1;</mml:mi>
<mml:mo>+</mml:mo>
<mml:mi>&#x3b2;</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">]</mml:mo>
</mml:mrow>
<mml:mo>=</mml:mo>
<mml:mn>2</mml:mn>
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mi>&#x3b1;</mml:mi>
</mml:msub>
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mi>&#x3b2;</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> (<xref ref-type="bibr" rid="B63">63</xref>). Overall, we find that a majority (75 of 119) HLA-DP and -DQ <italic>alpha + &#x3b2;</italic> pairs appear to be in linkage equilibrium, i.e., not co-inherited (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5A</bold>
</xref>; only subunits comprising heterodimers observed in at least 30 individuals are considered). Notably, all of the pairs that Tollefsen et&#xa0;al. (<xref ref-type="bibr" rid="B62">62</xref>) propose to be incompatible are in equilibrium (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5B</bold>
</xref>).</p>
<fig id="f5" position="float">
<label>Figure&#xa0;5</label>
<caption>
<p>Trans-complemented heterodimers may not form stable HLAs. <bold>(A)</bold> Statistical analysis of the marginal-to-joint probability ratio of heterodimers forming from subunits in linkage equilibrium. We identify these heterodimers as those which differ <inline-formula>
<mml:math display="inline" id="im39">
<mml:mrow>
<mml:mo>&gt;</mml:mo>
<mml:mn>5</mml:mn>
<mml:mi>&#x3c3;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> from ratio of 2 expected for genes in linkage equilibrium. We measure an average probability ratio of <inline-formula>
<mml:math display="inline" id="im40">
<mml:mrow>
<mml:mn>1.97</mml:mn>
<mml:mo>&#xb1;</mml:mo>
<mml:mn>0.04</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>. Error bars are derived from propagating poisson uncertainties. <bold>(B)</bold> Expected probability of randomly pairing <bold>
<italic>&#x3b1;</italic>
</bold> and <italic>&#x3b2;</italic> chains of DP and DQ heterodimers plotted against the observed joint probabilities. Probabilities are calculated from the normalized inverse frequencies. The probability of randomly pairing is calculated as the product of the observed marginal probabilities of the subunits. The dashed green line is the expected correlation for random trans-complementary pairing. We identify hetorodimers formed from subunits in linkage equilibrium (shown in orange) as in <bold>(A)</bold>. DQ heterodimers formed from pairing of mismatched groups as defined by (<xref ref-type="bibr" rid="B62">62</xref>) are shown with black circles. These mismatched group heterodimers cluster around the dashed green line indicating random trans-complementary pairing. <bold>(C)</bold> DQA1*01:02+DQB1*03:01 is an example of an HLA where we are unable to identify any ESs that separate cases and controls. <bold>(D)</bold> Model performance of HLA-DP and -DQ models including HLAs forming from subunits in linkage equilibrium. Here we show performance derived from 5-fold cross validation (CV) of the train sample which is consistent with holdout performance.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fimmu-16-1603730-g005.tif">
<alt-text content-type="machine-generated">Four-panel figure showing various data analyses related to HLA haplotypes. Panel (A): Scatter plot of \( P_{a^*}P_{b}/P_{a+\beta} \) against the number of positive cases with standard deviation shading. Panel (B): Log-log plot comparing observed probability and random pairing probability with a line indicating random trans-complementary pairing. Panel (C): Scatter plot of enhanced sequence count versus total unique rearrangements for controls and cases. Panel (D): Scatter plot of AUC-ROC against the number of positive cases with data for disequilibrium, equilibrium, and mismatched groups. Legends describe plot indicators.</alt-text>
</graphic>
</fig>
<p>Given the tight linkage between genes encoding subunits, any pair expressed in <italic>cis</italic> in at least one individual is likely to be in LD in a large cohort. Consistent with this hypothesis, every individual heterozygous at both the <italic>&#x3b1;</italic> and <italic>a</italic> locus has at least two of four <italic>&#x3b1;/&#x3b2;</italic> pairs in LD; conversely, no individual should have more than two <italic>&#x3b1;/&#x3b2;</italic> pairs in equilibrium. We confirm that no subject in our cohort has more than two heterodimers formed from subunits in linkage equilibrium, as expected. Taken together, we conclude that LD is a strong proxy for <italic>cis</italic>-complementarity, and that, given strong selection pressure, incompatible pairs are only expressed in <italic>trans</italic>.</p>
<p>If incompatible pairs are truly non-functional (with respect to antigen presentation and T-cell recognition), then there should not be any TCR<italic>&#x3b2;</italic>s that are specific to such pairs. As an example, we are unable to identify distinguishing TCR<italic>&#x3b2;</italic>s forDQA1*01:02+DQB1*03:01, which both violates the Tollefsen et&#xa0;al. (<xref ref-type="bibr" rid="B62">62</xref>) pairing rules and is in linkage equilibrium (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5C</bold>
</xref>). Moreover, all of our high-frequency, poor-performing HLA-DP and -DQ imputation models are for heterodimers formingfrom subunits that are in linkage equilibrium, and thus are almost certainly expressed in <italic>trans</italic> (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5D</bold>
</xref>; see also <xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3C</bold>
</xref>). Moreover, almost all pairs that violate the Tollefsen et&#xa0;al. (<xref ref-type="bibr" rid="B62">62</xref>) pairing rules have lower-than-expectedimputation performance (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5D</bold>
</xref>).</p>
<p>Notably, while heterodimer incompatibility implies both linkage equilibrium and poor model performance, not all heterodimers forming from subunits in linkage equilibrium result in poor performing models. Thus, trans-complementation may yield heterodimers which can drive a T-cell response resulting in identifiable TCR<italic>&#x3b2;</italic>s and a high-accuracy imputation model (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5D</bold>
</xref>).</p>
<p>Using these results on model performance and gene linkage, we can extend the Tollefsen et&#xa0;al. (<xref ref-type="bibr" rid="B62">62</xref>) pairing rules to the HLA-DP locus: DPA1*02 appears to form unstable heterodimers when paired with DPB1*02 and DPB1*04; DPA1*01 is apparentlyunrestricted, forming stable heterodimers with subunits from all DPB1 groups in our sample.</p>
</sec>
<sec id="s2_6">
<title>HLA associated sequences are memory T cells responding to common antigens</title>
<p>The T-cell repertoire consists of a mixture of naive and memory T cells. In principle, HLA-restricted antigen presentation will bias both thymic selection and clonal expansion, and thus HLA-specific signatures may exist in both compartments. However, ourstatistical approach to identifying HLA-specific public TCR<italic>&#x3b2;</italic>s likely favors identification of TCRs from memory T-cells.</p>
<p>We investigate characteristics of HLA associated sequences by comparing the distribution of ESs observed in the memory and naive compartments sequenced from 45 individuals who were not included in the original study. For each subject, we sequence five separate repertoires: the memory and naive compartments of CD8<sup>+</sup> and CD4<sup>+</sup> T cells, respectively, and the unsorted repertoire. As sequence-based typing was unavailable for these individuals, we treat the imputed HLAs from the the unsorted repertoire as ground truth (limiting to 90 models with &gt;0.95 precision and recall). For each repertoire and each possible HLA, we compute the weighted breadth of the HLA-specific ESs observed in the repertoire. Across all 45 unsorted repertoires, the weighted breadth of both class I and class II ESs is substantially higher for the HLAs an individual expresses compared to those they do not express (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6A</bold>
</xref>; compare HLA-positive to -negative).</p>
<fig id="f6" position="float">
<label>Figure&#xa0;6</label>
<caption>
<p>Class I and class II associated ESs are TCR<italic>&#x3b2;</italic>s from CD8<sup>+</sup> and CD4<sup>+</sup> memory T cells, respectively. <bold>(A)</bold> Weighted breadth of 90 HLA associated ESs measured in 45 subjects with imputed HLAs. The breadth is sorted by whether the subject has the HLA or not and is then aggregated across all subjects and HLAs. To generate a comparable breadth across HLAs, which have varying number of ESs, we measure the median breadth in controls for all 90 HLAs, which we rescale to a mean of 1. We then normalize the breadth of any given HLA by this value. Breadth measured in <bold>(B)</bold> CD8<sup>+</sup> memory sorted, <bold>(C)</bold> CD8<sup>+</sup> naive sorted, <bold>(D)</bold> CD4<sup>+</sup> memory sorted and <bold>(E)</bold> CD4<sup>+</sup> naive sorted repertoires. We measure slightly elevated breadth in the CD8<sup>+</sup> and CD4<sup>+</sup> naive sorted repertoires for class I and class II HLAs, respectively. This elevation may be due to surface markers not perfectly discriminating naive and memory compartments or to a weak HLA specific signal due to the HLA interactions required for maintaining homeostatic equilibrium of naive T cells (<xref ref-type="bibr" rid="B75">75</xref>).</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fimmu-16-1603730-g006.tif">
<alt-text content-type="machine-generated">Box plots showing weighted breadth in \(10^{-3}\) for various conditions. (A) Unsorted: HLA Positive and Negative, Class I and II. (B) CD8+ Memory Sort: Class I and II. (C) CD8+ Naive Sort: Class I and II. (D) CD4+ Memory Sort: HLA Positive and Negative, Class I and II. (E) CD4+ Naive Sort: HLA Positive and Negative, Class I and II. Higher values observed in HLA Positive for Class II in several panels.</alt-text>
</graphic>
</fig>
<p>Within the sorted compartments, a striking pattern emerges: in the naive compartments, there is little difference in the breadth of ES specific for an individual&#x2019;s expressed HLAs compared to background (<xref ref-type="fig" rid="f6">
<bold>Figures&#xa0;6C, E</bold>
</xref>), while in the memory compartments, ESs specific to the individuals&#x2019; expressed HLAs have far higher breadth (<xref ref-type="fig" rid="f6">
<bold>Figures&#xa0;6B, D</bold>
</xref>). Moreover, within the memory compartment, CD8<sup>+</sup> cells are closely linked to high relative breadth of class I HLA ESs, while CD4<sup>+</sup> cells are closely linked to high relative breadth of class II HLA ESs. This result provides further confirmation that ESs are correctly mapped to HLAs despite the challenges of HLA LD.</p>
<p>The centrality of the memory compartment in driving our HLA imputation signal raises several additional hypotheses. The first is that clonal expansion increases the likelihood of detection for ESs. This increased likelihood implies that, while ESs are frequently observed in individuals without the associated HLA, they will tend to be at higher repertoire frequency among individuals who do express the HLA. Indeed, we observe a notable increase in the distribution of clonal frequency among cases compared controls (<xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7A</bold>
</xref>).</p>
<fig id="f7" position="float">
<label>Figure&#xa0;7</label>
<caption>
<p>Many HLA ESs are T cells responding to common pathogens. <bold>(A)</bold> Cumulative distribution of clone count per unique rearrangement as measured in cases (blue) and controls (orange). ESs are generally more expanded when they are observed in subjects with the restricting HLA. <bold>(B)</bold> Cumulative distribution of the number of unique rearrangements mapping to an ES, i.e., convergent recombination count. ESs show more convergent recombination when observed in cases (blue) as compared to controls (orange). <bold>(C)</bold> Intersection of SARS-CoV-2 specific ESs derived via a FET on samples with PCR labels and HLA ES sets. Blue curves are HLA ES sets derived from samples which include Covid-19 positive subjects and orange curves are from samples with all Covid-19 positive subjects removed. <bold>(D)</bold> Fraction of SARS-CoV-2 ESs observed in subjects relative to the total fraction possible given the ES HLA association determined from intersecting the SARS-CoV-2 ESs with the HLA ES sets. Here we impute HLAs using our models. For <bold>&#x201c;</bold>HLA +<bold>&#x201d;</bold> we only count sequences associated with HLAs inferred for the subject and for <bold>&#x201c;</bold>HLA -<bold>&#x201d;</bold> we only count sequences associated with HLAs that are not inferred for the subject.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fimmu-16-1603730-g007.tif">
<alt-text content-type="machine-generated">Four-panel figure illustrating data distribution and analysis related to COVID.   Panel A: Histogram showing cumulative distribution of clone count for cases (blue) and controls (brown).   Panel B: Histogram displaying cumulative distribution of convergent recombination count for cases (blue) and controls (brown).   Panel C: Line graph depicting fraction of COVID-effective sequences overlapping HLA predictive sequences across p-value cutoffs, comparing COVID-positive subjects (blue) and pre-COVID subjects (brown).  Panel D: Box plot showing fraction of possible sequences observed among groups defined by COVID and HLA status, comparing CD8+ (blue) and CD4+ (green) cells.</alt-text>
</graphic>
</fig>
<p>The second hypothesis is that clonal expansion results from antigen exposure, which will also result in polyclonal expansion of T cells that express distinct TCRs that all respond to the same antigen. An extreme form of polyclonal expansion is <italic>convergent recombination</italic>, in which multiple, distinct TCR DNA sequences encode identical amino acid sequences. Consistent with this hypothesis, the per-ES convergent recombination rates are higher when ESs are observed in cases as compared to controls (<xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7B</bold>
</xref>; conditional on the ES being present in the repertoire).</p>
<p>The publicity of HLA ESs combined with their apparent antigen-specific clonal expansion suggests that these sequences are responding to antigens which are common in the human population (<xref ref-type="bibr" rid="B64">64</xref>). We test this hypothesis in the context of SARS-CoV-2 exposure. Because of its novel nature, SARS-CoV-2 is especially well-suited for this task as we are able to confidently assign Covid-19 negativity to samples collected before 2020. In our training sample for deriving HLA restricted sequences, 694 ofthe 4,144 subjects (~ 20%) are Covid-19 positive based on PCR labels; the remaining samples are collected before 2020 and thus Covid-19 negative. Because SARS-CoV-2 exposure is relatively high in our training sample, we expect that some of the HLA-specific ESs we identity are SARS-CoV-2 specific.</p>
<p>We identify 6866 SARS-CoV-2-specific ESs using a set of 1523 SARS-CoV-2 PCR-positive samples that have no overlap with the typed HLA training samples and 4386 controls (1008 controls overlap with the typed HLA samples). A high proportion (80% of the most confident SARS-CoV-2 specific ESs) are also HLA-specific ESs (<xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7C</bold>
</xref>, blue line). This overlap in ESs results from the fact that ~ 20% of our typed HLA training samples are SARS-CoV-2 positive, i.e., SARS-CoV-2 specific ESs are predictiveof HLAs as well. In contrast, if we define an alternative set of HLA-ESs using only 3,450 repertoires which were sampled prior to 2020, we find very little overlap (<xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7C</bold>
</xref>, orange line). The limited overlap we do observe may be due to cross-reactivityto homologous epitopes from other coronaviruses and/or false positive sequences in the SARS-CoV-2/HLA ES set.</p>
<p>The intersection of SARS-CoV-2 specific ES set with the and HLA specific ES sets yields 1,880 TCR<italic>&#x3b2;</italic>s (using a threshold of <inline-formula>
<mml:math display="inline" id="im41">
<mml:mrow>
<mml:msup>
<mml:mi>p</mml:mi>
<mml:mo>*</mml:mo>
</mml:msup>
<mml:mo>=</mml:mo>
<mml:mi>p</mml:mi>
<mml:mo>&lt;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mn>10</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>4</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>) that are associated with a particular HLA in the context of SARS-CoV-2 infection. Thus, these ESs are almost certainly specific to commonly targeted SARS-CoV-2 T-cell epitopes. To confirm this specificity, we impute HLAs for samples in the SARS-CoV-2 training data<xref ref-type="fn" rid="fn5">
<sup>5</sup>
</xref> and then compute the fraction of HLA-associated SARS-CoV-2 ES observed in their repertoire. For &#x201c;HLA +&#x201d; and &#x201c;HLA -&#x201d; subjects we only count sequences if the subject has or does not have the HLA which the SARS-CoV-2 ES is associated with, respectively. Notably, both class-I and class-II associated TCR<italic>&#x3b2;</italic>s are far more commonly observed in individuals with the restricting HLA and known SARS-CoV-2 infection (<xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7D</bold>
</xref>), thus confirming the HLA- and pathogen-specificity of these TCR<italic>&#x3b2;</italic>s and further demonstrating that while TCR<italic>&#x3b2;</italic>s may be cross-reactive to many distinct antigens, the likelihood of cross-reactivity <italic>in vivo</italic> is low (<xref ref-type="bibr" rid="B65">65</xref>).</p>
<p>We conclude that, taken together, these results demonstrate that the majority of HLA-specific ESs are the result of clonal expansion of T cells responding to common antigens, thus establishing an immunological foundation for HLA imputation from TCR<italic>&#x3b2;</italic>repertoires.</p>
</sec>
</sec>
<sec id="s3" sec-type="discussion">
<title>Discussion</title>
<p>The T-cell repertoire of any individual consists of ~ 10<sup>8</sup> unique TCRs out of an estimated ~ 10<sup>16</sup> possibilities (<xref ref-type="bibr" rid="B66">66</xref>, <xref ref-type="bibr" rid="B67">67</xref>), of which only <inline-formula>
<mml:math display="inline" id="im42">
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mn>10</mml:mn>
</mml:mrow>
<mml:mn>5</mml:mn>
</mml:msup>
<mml:mo>&#x2212;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mn>10</mml:mn>
</mml:mrow>
<mml:mn>6</mml:mn>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula> TCRs may be practically sampled from any single repertoire using current techniques. Given the enormous diversity of possible TCRs, naively, little overlap in the TCR repertoire of different subjects may be expected. However, several factors significantly increase the likelihood of observing public TCRs: (1) the probability distribution of TCRs generated via V(D)J recombination is non-uniform and spans ~ 25 orders of magnitude (<xref ref-type="bibr" rid="B68">68</xref>), such that higher generation probability TCRs are more commonly observed in the naive repertoire; (2) antigen-experienced T cells clonally expand and are thus more likely to be observed in a repertoire; and (3) the immune response is focused on only a few immunogenic epitopes per HLA out of the many possible derived from any given antigenic exposure, an effect called <italic>immunodominance</italic> (<xref ref-type="bibr" rid="B69">69</xref>). As a consequence, the likelihood of observing the same TCRs in the repertoires of multiple subjects with shared antigenic exposure and appropriate restricting HLA is significantly higher than naively expected. Studies have shown that public TCRs can be identified that permit sensitive and specific diagnosis of individuals with past SARS-CoV-2 infection (<xref ref-type="bibr" rid="B37">37</xref>) and Lyme disease (<xref ref-type="bibr" rid="B38">38</xref>) as well as to determine who is seropositive for Cytomegalovirus (<xref ref-type="bibr" rid="B35">35</xref>). Given that these antigens are presented by HLAs, it is perhaps unsurprising that these public TCRs are also specific to the HLA context (<xref ref-type="bibr" rid="B35">35</xref>, <xref ref-type="bibr" rid="B36">36</xref>). Here we leverage this public fingerprint of TCRs to identify HLA associatedsequences, allowing us to impute HLA types with extremely high accuracy and opening a new window into functional characteristics of HLAs.</p>
<p>We identify HLA specific TCR using only the TCR<italic>&#x3b2;</italic> repertoire, even though the specificity of pHLA is to TCR<italic>&#x3b1;&#x3b2;</italic>. Enhanced sequences elicit an immune response only in subjects with the appropriate shared restricting HLA and pathogenic exposure history (<xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7D</bold>
</xref>), meaning, enhanced sequences are responding to the same pHLAs in different subjects. This result implies that an observed TCR<italic>&#x3b2;</italic> shared among multiple subjects in a given HLA context is very likely paired with one or a very small set of compatible TCR<italic>&#x3b1;</italic>s. In this respect, TCR<italic>&#x3b2;</italic> repertoires are not unique; analysis of TCR<italic>&#x3b1;</italic> repertoires would lead to similar results and conclusions as presented here<xref ref-type="fn" rid="fn6">
<sup>6</sup>
</xref>. Thus, our ability to identify HLA specific TCRs using only a single chain of the TCR heterodimer is not a characteristic of the TCR<italic>&#x3b2;</italic>s but rather a consequence of our procedure for identifying enhanced sequences and the relevant underlying biological processes.</p>
<p>A key finding of this work is that TCRs are typically specific to HLA allotypes (two field resolution) and to class II heterodimers encoded by both the <italic>&#x3b1;</italic> and <italic>&#x3b2;</italic> chains, although there are some notable exceptions of TCR<italic>&#x3b2;</italic>s that are specific to HLA groups (one field resolution) or to either the <italic>&#x3b1;</italic> or <italic>&#x3b2;</italic> subunits of HLA-DP and -DQ. While most HLAs elicit a strong and diverse public TCR response, others elicit little or no response, consistent with these HLAs deriving from incompatible <italic>&#x3b1;</italic> and <italic>&#x3b2;</italic> subunits and providing further support for the widespread prevalence of non-functional class II heterodimeric pairs resulting from trans-complementation. Furthermore, we find that the breadth of an HLA-specific TCR<italic>&#x3b2;</italic> response is larger among individuals expressing two (or more) copies of the HLA, suggesting a dose-dependent effect of antigenic exposure on the diversity of expanded T-cell clones. These insights highlight the exquisite specificity of public TCR<italic>&#x3b2;</italic>s and demonstrate the potential of population-level TCR analysis for probing functional aspects of the immune system.</p>
<p>We show that class I and class II HLA-associated TCR<italic>&#x3b2;</italic>s are found on CD8<sup>+</sup> and CD4<sup>+</sup> memory T cells, respectively, which is consistent with their publicity resulting from clonal expansion in response to antigenic-exposure. The public nature of these TCR<italic>&#x3b2;</italic>s suggests that they are likely specific to peptides derived from common pathogens, vaccines and conserved endogenous-antigens. Consistent with this hypothesis, ~20% of subjects in our training sample are covid positive and we identify a consequently large fraction of SARS-CoV-2-specific TCR<italic>&#x3b2;</italic>s as HLA associated. Notably, this overlap provides probable pathogenic and HLA assignments to these TCR<italic>&#x3b2;</italic>s, as demonstrated by the profound enrichment of these TCR<italic>&#x3b2;</italic>s only among SARS-CoV-2-positive individuals expressing the appropriate restricting HLA. Thus, while only a subset of HLA-associated TCRs are observed in any given individual, the particular TCR<italic>&#x3b2;</italic> subset observed reflects that individual&#x2019;s history of exposure to many common antigens.</p>
<p>Our results imply that the vast majority of HLA-associated TCR<italic>&#x3b2;</italic>s identified in this study likely derive from common antigens, making HLA-association a critical step in decoding the human T-cell repertoire. Moreover, the high imputation accuracy of our HLA models allows us to statistically HLA type all repertoires ever sequenced, thereby expanding the effective size of HLA-typed and TCR-sequenced cohorts by several orders of magnitude and further facilitating decoding efforts. The TCR repertoire is a Rosetta Stone of the human immune system, providing a rich source of information for characterizing both the genetic background and exposure history of individuals at a population scale (<xref ref-type="bibr" rid="B70">70</xref>, <xref ref-type="bibr" rid="B71">71</xref>). Mapping TCRs to HLAs and disease exposures and imputing HLA and disease exposure from TCRs represent important steps toward decoding the immunological history of individuals using immunosequencing.</p>
</sec>
<sec id="s4" sec-type="materials|methods">
<title>Materials and methods</title>
<sec id="s4_1">
<title>Human samples</title>
<p>TCR<italic>&#x3b2;</italic> and HLA sequence data from human samples used for these studies were aggregated from several independent study collections described below. All necessary patient/participant consent has been obtained for each study and the appropriate institutional forms have been archived.</p>
<list list-type="order">
<list-item>
<p>Whole blood samples from DLS (Discovery Life Sciences, Huntsville, AL) were collected under Protocol DLS13 for collection of clinical samples.</p>
</list-item>
<list-item>
<p>PBMC used for the sorted repertoire experiments were collected and processed by Bloodworks Northwest (Seattle, WA). Volunteer donors were consented and collected under the Bloodworks Research Donor Collection Protocol BT001.</p>
</list-item>
<list-item>
<p>PBMC were obtained from the Fred Hutchinson Cancer Research Center Research Cell Bank biorepository of healthy bone marrow donors. The sample collection protocol was approved and supervised by the Fred Hutchinson Cancer Research Center Institutional Review Board (IRB) (<xref ref-type="bibr" rid="B35">35</xref>).</p>
</list-item>
<list-item>
<p>Blood collected from human subjects were approved by the IRBs of Johns Hopkins University and Stanford University. All participants provided written informed consent prior to enrollment (<xref ref-type="bibr" rid="B38">38</xref>).</p>
</list-item>
<list-item>
<p>Blood collected for the ImmuneRACE Study has been approved by the Western IRB (WIRB) (reference number 1-1281891-1). The trial has received appropriate ethical approval from WIRB as described (<xref ref-type="bibr" rid="B72">72</xref>).</p>
</list-item>
<list-item>
<p>Procedures for the INCOV study were approved by the IRBs at Providence St. Joseph Health with IRB study number STUDY2020000175, the WIRB with IRB study number 20170658, and the University of Washington with IRB study numbers STUDY00000959 and STUDY00002929 (<xref ref-type="bibr" rid="B73">73</xref>).</p>
</list-item>
<list-item>
<p>Human samples from the Virology Research Clinic at the University of Washington was collected under an IRB-approved study (NCT04338360) (<xref ref-type="bibr" rid="B53">53</xref>).</p>
</list-item>
<list-item>
<p>Blood from the Institute of Medical, Pharmaceutical, and Health Sciences, Kanazawa University (KU) was collected with informed consent as described by documents approved by the KU review board (document number 585-2).</p>
</list-item>
</list>
</sec>
<sec id="s4_2">
<title>TCR sequencing</title>
<p>We use the ImmunoSEQ assay developed by Adaptive Biotechnologies to measure the TCR<italic>&#x3b2;</italic> repertoire. ImmunoSEQ is a multiplexed PCR-based method targeting rearranged TCR<italic>&#x3b2;</italic> sequences (<xref ref-type="bibr" rid="B45">45</xref>). The assay uses a panel of primers specific to all functional TRBV and TRBJ gene segments to amplify the full V(D)J region, including part of the TRBV segment, the entire diversity (D) and a portion of the J segment. The sequenced portions of the V and J segments are sufficient to determine gene usage. This region also includes the complete hypervariable complementarity-determining region 3 (CDR3), which accounts for most of the TCR diversity and is the key determinant of TCR antigen specificity. The reverse primer binds near the 3&#x2032; end of the J region, adjacent to the constant region and may extend into the 5&#x2032; end of the TCR. PCR primers contain universal priming sites on the 3&#x2032;-end and Illumina sequencing adaptors on the 5&#x2032;-end. This design enables robust amplification across a wide range of rearrangements while controlling for bias. High-throughput sequencing of these amplicons provides accurate quantification of unique TCR<italic>&#x3b2;</italic> clonotypes.</p>
<p>Flow cytometry and cell sorting <inline-formula>
<mml:math display="inline" id="im43">
<mml:mrow>
<mml:mn>3</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>5</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mn>10</mml:mn>
</mml:mrow>
<mml:mn>7</mml:mn>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula> PBMC were stained using a cocktail of antibodies that included CD3 (clone UCHT1, Biolegend), CD4 (clone OKT4, Biolegend), CD8 (clone RPA-T8, Biolegend), CD45RA(clone HI100, BD Bioscience), CCR7 (clone G043H7, Biolegend), CD95 (clone DX2, Biolegend), and CD28 (clone CD28.2, Biolegend) for 10 minutes at 4 degrees C. PBMC were washed with MACS buffer (Miltenyi Biotec) and then PE+ CD3+ T cells were enriched using anti-PE Microbeads with LS columns (Miltenyi Biotec) following the manufacturer&#x2019;s protocol. The enriched CD3 sample was sorted using a FACSAria Fusion Flow Cytometer (BD Biosciences) to isolate naive CD4 (CD4<sup>+</sup> CD3<sup>+</sup> CD45RA<sup>+</sup> CD95<sup>&#x2013;</sup> CD28<sup>+</sup> CCR7<sup>+</sup>), memory CD4 (CD4<sup>+</sup> CD3<sup>+</sup> non-naive CD4), naive CD8 (CD8<sup>+</sup> CD3<sup>+</sup> CD45RA<sup>+</sup> CD95<sup>&#x2013;</sup> CD28<sup>+</sup> CCR7<sup>+</sup>) and memory CD8 (CD8<sup>+</sup>CD3<sup>+</sup> non-naive CD8). Between 150,000 and <inline-formula>
<mml:math display="inline" id="im44">
<mml:mrow>
<mml:mn>3</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mn>10</mml:mn>
</mml:mrow>
<mml:mn>6</mml:mn>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula> T cells were sorted and sent in for sequencing for each subset. TCR<italic>&#x3b2;</italic> sequencing was carried out using the ImmunoSEQ assay at Adaptive Biotechnologies.</p>
</sec>
<sec id="s4_3">
<title>Model training</title>
<p>We independently train a model for each HLA using the following procedure:</p>
<list list-type="order">
<list-item>
<p>We randomly split 80% and 20% of all typed samples into a training and holdout set.</p>
</list-item>
<list-item>
<p>Using typed HLA data, we label all samples as cases, controls or unlabeled for the HLA being modeled.</p>
</list-item>
<list-item>
<p>We derive an ES set using the FET applied to cases and controls.</p>
</list-item>
<list-item>
<p>We select a subset of ESs which associate to the HLA being modeled via the L1LR method.</p>
</list-item>
<list-item>
<p>We derive an individual weight for each sequence in the list of ESs from step 3).</p>
</list-item>
<list-item>
<p>We generate two features which are the logarithm of the weighted sum of the convergent recombination count (i.e., number of unique DNA rearrangements mapping to a given CDR3) of enhanced sequences and the total unique rearrangements in the repertoire, respectively.</p>
</list-item>
<list-item>
<p>We fit the standard Scikit-Learn logistic regression classifier to the training data and evaluate the model in cross validation to select the best FET p-value cutoff.</p>
</list-item>
<list-item>
<p>We train the final model on all the train data and evaluate on the holdout set.</p>
</list-item>
</list>
<p>Below we describe training steps in detail using the following definitions: Let <italic>H</italic> be the set of <italic>N<sub>H</sub>
</italic> typed HLA allotypes in our training set and <inline-formula>
<mml:math display="inline" id="im45">
<mml:mrow>
<mml:msub>
<mml:mi>h</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x2208;</mml:mo>
<mml:mi>H</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>, <inline-formula>
<mml:math display="inline" id="im46">
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>,</mml:mo>
<mml:mo>&#x2026;</mml:mo>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>N</mml:mi>
<mml:mi>H</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> refer to any single HLA in the set. The training set of <italic>h<sub>i</sub>
</italic> is denoted as <inline-formula>
<mml:math display="inline" id="im47">
<mml:mrow>
<mml:msub>
<mml:mi>t</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x2208;</mml:mo>
<mml:mi>T</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> where <italic>T</italic> is the set of <italic>N<sub>T</sub>
</italic> training samples. We similarly define a test (or holdout) set for each HLA <inline-formula>
<mml:math display="inline" id="im48">
<mml:mrow>
<mml:msubsup>
<mml:mi>t</mml:mi>
<mml:mi>i</mml:mi>
<mml:mo>&#x2032;</mml:mo>
</mml:msubsup>
<mml:mo>&#x2208;</mml:mo>
<mml:msup>
<mml:mi>T</mml:mi>
<mml:mo>&#x2032;</mml:mo>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula> where <italic>T</italic>&#x2032; is the set of <inline-formula>
<mml:math display="inline" id="im49">
<mml:mrow>
<mml:msub>
<mml:mi>N</mml:mi>
<mml:msup>
<mml:mi>T</mml:mi>
<mml:mo>&#x2032;</mml:mo>
</mml:msup>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> holdout samples. Below we drop the subscript <italic>i</italic> unless needed for clarity as the procedure is applied to each HLA independently.</p>
<p>Step 1: <italic>T</italic> and <italic>T</italic>&#x2032; are derived from a random 80/20 split of all typed data with <inline-formula>
<mml:math display="inline" id="im50">
<mml:mrow>
<mml:msub>
<mml:mi>N</mml:mi>
<mml:mi>T</mml:mi>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>N</mml:mi>
<mml:msup>
<mml:mi>T</mml:mi>
<mml:mo>&#x2032;</mml:mo>
</mml:msup>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mn>4</mml:mn>
<mml:mo>,</mml:mo>
<mml:mn>144</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>. <xref ref-type="supplementary-material" rid="SF1">
<bold>Supplementary Figure S1</bold>
</xref> shows the age, sex and ethnicity distribution of sample subjects.</p>
<p>Step 2: When building a model for a given HLA <inline-formula>
<mml:math display="inline" id="im51">
<mml:mrow>
<mml:msub>
<mml:mi>h</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, samples are labeled as cases (label = 1) or controls (label = 0) if a subject expresses or does not express <inline-formula>
<mml:math display="inline" id="im52">
<mml:mrow>
<mml:msub>
<mml:mi>h</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, respectively. A subset of controls are unlabeled if a <ext-link ext-link-type="uri" xlink:href="http://hla.alleles.org/alleles/p_groups.html">p-group matched HLA</ext-link> to <inline-formula>
<mml:math display="inline" id="im53">
<mml:mrow>
<mml:msub>
<mml:mi>h</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is expressed by the subject. P-group matched HLAs share the same antigen binding domain and thus may share T-cell receptor (TCR) specificities.</p>
<p>Step 3: For any HLA <italic>h</italic>, an initial set of ESs, <italic>E</italic>, is defined using Fisher&#x2019;s Exact Test (FET) [<xref ref-type="bibr" rid="B74">74</xref>] applied to training set <italic>t</italic> of HLA <italic>h</italic>. The a range of p-value thresholds are used to identify ESs and the threshold is treated as ahyperparameter in the modeling; it is independently derived for each HLA we model.</p>
<p>Step 4: If HLA <italic>h</italic> is in linkage disequilibrium (LD) with other HLAs, the enhanced sequences specific to HLAs in LD will be present in the ES set of HLA <italic>h</italic> because of their co-occurrence in subjects (this is how LD is defined). The goal of our procedure is to identify and remove these sequences from the final set of ESs associated to <italic>h</italic>. Thus, a fundamental assumption of the model is that for a given train set, an ES may be associated with only a single HLA.</p>
<p>We enforce the assumption that each TCR<italic>&#x3b2;</italic> is specific to one HLA by fitting a logistic regression model with L1 regularization and we refer to this as the L1LR method. We independently associate each ES in <italic>E</italic> with a single HLA. Thus, the assumption that a given TCR<italic>&#x3b2;</italic> is associated to a single HLA is not globally enforced, i.e., it is possible that due to variations in training data that the same TCR<italic>&#x3b2;</italic> may be associated to multiple HLAs though this is rare (see <xref ref-type="supplementary-material" rid="SF2">
<bold>Supplementary Figure S2</bold>
</xref>).</p>
<p>When associating individual ESs to HLAs, we model the presence/absence of any given ES <inline-formula>
<mml:math display="inline" id="im54">
<mml:mrow>
<mml:msub>
<mml:mi>e</mml:mi>
<mml:mi>j</mml:mi>
</mml:msub>
<mml:mo>&#x2208;</mml:mo>
<mml:mi>E</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> in the training set <italic>t</italic> as a logistic regression classification. Here <italic>j</italic> denotes the individual TCR<italic>&#x3b2;</italic>s in the ES set. For any sample <inline-formula>
<mml:math display="inline" id="im55">
<mml:mrow>
<mml:msub>
<mml:mi>t</mml:mi>
<mml:mi>l</mml:mi>
</mml:msub>
<mml:mo>&#x2208;</mml:mo>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>, where <italic>l</italic> denotes individual samples in the training set <italic>t</italic>, the label for sequence <inline-formula>
<mml:math display="inline" id="im56">
<mml:mrow>
<mml:msub>
<mml:mi>e</mml:mi>
<mml:mi>j</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is either 0 or 1 if the sequences is present or absent in <inline-formula>
<mml:math display="inline" id="im57">
<mml:mrow>
<mml:msub>
<mml:mi>t</mml:mi>
<mml:mi>l</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, respectively. The feature vector for associating a given ES <inline-formula>
<mml:math display="inline" id="im58">
<mml:mrow>
<mml:msub>
<mml:mi>e</mml:mi>
<mml:mi>j</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> includes the indicator vector for the typed set of HLAs, i.e. <inline-formula>
<mml:math display="inline" id="im59">
<mml:mrow>
<mml:msub>
<mml:mi>I</mml:mi>
<mml:mrow>
<mml:mi>k</mml:mi>
<mml:mi>l</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> if sample <italic>l</italic> expresses HLA <inline-formula>
<mml:math display="inline" id="im60">
<mml:mrow>
<mml:msub>
<mml:mi>h</mml:mi>
<mml:mi>k</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula>
<mml:math display="inline" id="im61">
<mml:mrow>
<mml:msub>
<mml:mi>I</mml:mi>
<mml:mrow>
<mml:mi>k</mml:mi>
<mml:mi>l</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mn>0</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> if sample <italic>l</italic> does not express HLA <inline-formula>
<mml:math display="inline" id="im62">
<mml:mrow>
<mml:msub>
<mml:mi>h</mml:mi>
<mml:mi>k</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>. Here, <italic>k</italic> indicates the subset of HLAs in <italic>H</italic> is in LD with HLA <italic>h</italic> (defined by FET p-value &lt; <inline-formula>
<mml:math display="inline" id="im63">
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mn>10</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>3</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>). Thus, the feature vector is a binary vector indicating whether a subject has or does not have a given HLA which is observed to co-occur with the HLA being modeled. When associating sequences we include the total number of unique rearrangements in each sample repertoire, <inline-formula>
<mml:math display="inline" id="im64">
<mml:mrow>
<mml:msub>
<mml:mi>d</mml:mi>
<mml:mi>l</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> as a covariate not subject to L1 regularization. We&#xa0;model each ES independently and thus drop the subscript <italic>j</italic> in the following for clarity. Taken together a single ES <italic>e</italic> is modeled such that.</p>
<disp-formula id="eq1">
<label>(1)</label>
<mml:math display="block" id="M1">
<mml:mrow>
<mml:mi>l</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>g</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>t</mml:mi>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mtext>label</mml:mtext>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>=</mml:mo>
<mml:munder>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>k</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>l</mml:mi>
</mml:mrow>
</mml:munder>
<mml:msub>
<mml:mi>I</mml:mi>
<mml:mrow>
<mml:mi>k</mml:mi>
<mml:mi>l</mml:mi>
</mml:mrow>
</mml:msub>
<mml:msub>
<mml:mi>&#x3b2;</mml:mi>
<mml:mi>k</mml:mi>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:munder>
<mml:mo>&#x2211;</mml:mo>
<mml:mi>l</mml:mi>
</mml:munder>
<mml:mi>&#x3b1;</mml:mi>
<mml:msub>
<mml:mi>d</mml:mi>
<mml:mi>l</mml:mi>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:mi>&#x3bb;</mml:mi>
<mml:munder>
<mml:mo>&#x2211;</mml:mo>
<mml:mi>k</mml:mi>
</mml:munder>
<mml:msub>
<mml:mi>&#x3b2;</mml:mi>
<mml:mi>k</mml:mi>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:mi>b</mml:mi>
<mml:mo>.</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>
<p>In <xref ref-type="disp-formula" rid="eq1">Equation 1</xref>, <italic>&#x3b1;</italic> and <italic>&#x3b2;</italic> are free parameters, <italic>b</italic> is the bias term and <italic>&#x3bb;</italic> is the regularization strength applied to <italic>&#x3b2;</italic>. We find the best-fit parameters by minimizing the log-loss and tune <italic>&#x3bb;</italic> to be the smallest value that yields precisely one non-zero coefficient in <inline-formula>
<mml:math display="inline" id="im65">
<mml:mrow>
<mml:msub>
<mml:mi>&#x3b2;</mml:mi>
<mml:mi>k</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>. If the non-zero coefficient is <inline-formula>
<mml:math display="inline" id="im66">
<mml:mrow>
<mml:msub>
<mml:mi>&#x3b2;</mml:mi>
<mml:mrow>
<mml:mi>k</mml:mi>
<mml:mo>=</mml:mo>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, then the sequence is associated with the HLA being modeled and is retained as part of the final ES set. If the non-zero coefficient is <inline-formula>
<mml:math display="inline" id="im67">
<mml:mrow>
<mml:msub>
<mml:mi>&#x3b2;</mml:mi>
<mml:mrow>
<mml:mi>k</mml:mi>
<mml:mo>&#x2260;</mml:mo>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>. the sequences is excluded from the final ES set of HLA <italic>h</italic> which is denoted as <inline-formula>
<mml:math display="inline" id="im68">
<mml:mover accent="true">
<mml:mi>E</mml:mi>
<mml:mo>&#x2dc;</mml:mo>
</mml:mover>
</mml:math>
</inline-formula>. We weight each sample by the square root of the convergent recombination count when finding the best-fit parameters and zero count samples are given a weight of unity. The effectiveness of our procedure to resolve LD is demonstrated in <xref ref-type="supplementary-material" rid="SF2">
<bold>Supplementary Figure S2</bold>
</xref>.</p>
<p>Step 5: We derive a per-sequence weight, <inline-formula>
<mml:math display="inline" id="im69">
<mml:mrow>
<mml:msub>
<mml:mi>w</mml:mi>
<mml:mi>j</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> for each sequence <inline-formula>
<mml:math display="inline" id="im70">
<mml:mrow>
<mml:msub>
<mml:mi>e</mml:mi>
<mml:mi>j</mml:mi>
</mml:msub>
<mml:mo>&#x2208;</mml:mo>
<mml:mover accent="true">
<mml:mi>E</mml:mi>
<mml:mo>&#x2dc;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:math>
</inline-formula> by fitting a two feature logistic regression classifier. Here <italic>j</italic> refers to individual sequences in <inline-formula>
<mml:math display="inline" id="im71">
<mml:mover accent="true">
<mml:mi>E</mml:mi>
<mml:mo>&#x2dc;</mml:mo>
</mml:mover>
</mml:math>
</inline-formula>. Each sequence is fit independently. For each sequence the target of the classifier is whether the sample is a case or control of HLA <inline-formula>
<mml:math display="inline" id="im72">
<mml:mrow>
<mml:msub>
<mml:mi>h</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> and the features are the convergent recombination count of the sequence and total number of unique rearrangements in the given repertoire sample. Essentially, we build a model to discriminate cases from controls using the count of a single sequence and take the coefficient as a weight. In detail, we standardize the features by subtracting the mean and normalizing to the standard deviation of the features across all samples. We fit the default logistic regression model in the <ext-link ext-link-type="uri" xlink:href="https://scikit-learn.org/stable/modules/generated/sklearn.linear_model.LogisticRegression.html">Scikit-learn</ext-link> library which includes a fixed amount of L2 regularization (<inline-formula>
<mml:math display="inline" id="im73">
<mml:mrow>
<mml:mi>&#x3bb;</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>). This procedure yields a weight for each sequence in <inline-formula>
<mml:math display="inline" id="im74">
<mml:mrow>
<mml:msub>
<mml:mi>e</mml:mi>
<mml:mi>j</mml:mi>
</mml:msub>
<mml:mo>&#x2208;</mml:mo>
<mml:mover accent="true">
<mml:mi>E</mml:mi>
<mml:mo>&#x2dc;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:math>
</inline-formula>.</p>
<p>Step 6: The final classifier model is a two feature model where the features <italic>F</italic> for subject <italic>l</italic> are.</p>
<disp-formula id="eq2">
<label>(2)</label>
<mml:math display="block" id="M2">
<mml:mrow>
<mml:msub>
<mml:mi>F</mml:mi>
<mml:mi>l</mml:mi>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mrow>
<mml:mo>[</mml:mo>
<mml:mrow>
<mml:mtext>log</mml:mtext>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mo>+</mml:mo>
<mml:munder>
<mml:mo>&#x2211;</mml:mo>
<mml:mi>j</mml:mi>
</mml:munder>
<mml:msub>
<mml:mi>w</mml:mi>
<mml:mi>j</mml:mi>
</mml:msub>
<mml:msub>
<mml:mi>c</mml:mi>
<mml:mrow>
<mml:mi>l</mml:mi>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>,</mml:mo>
<mml:mtext>&#xa0;log</mml:mtext>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>N</mml:mi>
<mml:mi>l</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo>]</mml:mo>
</mml:mrow>
<mml:mo>.</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>
<p>In <xref ref-type="disp-formula" rid="eq2">Equation 2</xref> <inline-formula>
<mml:math display="inline" id="im75">
<mml:mrow>
<mml:msub>
<mml:mi>c</mml:mi>
<mml:mrow>
<mml:mi>l</mml:mi>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is the convergent recombination count of <inline-formula>
<mml:math display="inline" id="im76">
<mml:mrow>
<mml:msub>
<mml:mi>e</mml:mi>
<mml:mi>j</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> in sample <italic>l</italic>. These features, <inline-formula>
<mml:math display="inline" id="im77">
<mml:mrow>
<mml:msub>
<mml:mi>F</mml:mi>
<mml:mi>l</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, are used in a the standard Scikit-learn logistic regression to predict the presence/absence of an HLA for a given sample.</p>
<p>Step 7: To model any given HLA, we fit the standard Scikit-Learn logistic regression classifier using features generated in Step 6). We treat the p-value cutoff for identifying ESs via the FET as described in Step 3) as a hyperparameter of each HLA model. We train and evaluate a model using a five-fold cross validation strategy for p-value cutoffs = <inline-formula>
<mml:math display="inline" id="im78">
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">[</mml:mo>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mn>10</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>3</mml:mn>
</mml:mrow>
</mml:msup>
<mml:mo>,</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mn>10</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>4</mml:mn>
</mml:mrow>
</mml:msup>
<mml:mo>,</mml:mo>
<mml:mtext>&#xa0;</mml:mtext>
<mml:msup>
<mml:mrow>
<mml:mn>10</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>5</mml:mn>
</mml:mrow>
</mml:msup>
<mml:mo>,</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mn>10</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>6</mml:mn>
</mml:mrow>
</mml:msup>
<mml:mo>,</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mn>10</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>7</mml:mn>
</mml:mrow>
</mml:msup>
<mml:mo>,</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mn>10</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>8</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
<mml:mo stretchy="false">]</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula>. We adopt p-value cutoff of the highest performing cross-validation model.</p>
<p>Step 8: We generate our final model by adopting the p-value threshold determined in step 7) and train on the full set of training data. We evaluate the final model on the holdout set (<xref ref-type="supplementary-material" rid="SF3">
<bold>Supplementary Figure S3</bold>
</xref>&#x2013;<xref ref-type="supplementary-material" rid="SF8">
<bold>S8</bold>
</xref>).</p>
</sec>
</sec>
</body>
<back>
<sec id="s5" sec-type="data-availability">
<title>Data availability statement</title>
<p>A subset of the raw data sufficient to reproduce the results of this study is publicly available from Adaptive Biotechnologies at <ext-link ext-link-type="uri" xlink:href="https://clients.adaptivebiotech.com/pub/Emerson-2017-NatGen">https://clients.adaptivebiotech.com/pub/Emerson-2017-NatGen</ext-link>. The remaining data were generated by Adaptive Biotechnologies and are subject to their data sharing policies.</p>
</sec>
<sec id="s6" sec-type="ethics-statement">
<title>Ethics statement</title>
<p>There are multiple cohorts used in the paper and the IRBs are listed. The studies were conducted in accordance with the local legislation and institutional requirements. The participants provided their written informed consent to participate in this study.</p>
</sec>
<sec id="s7" sec-type="author-contributions">
<title>Author contributions</title>
<p>HZ: Conceptualization, Data curation, Investigation, Formal analysis, Methodology, Project administration, Software, Visualization, Writing &#x2013; original draft, Writing &#x2013; review &amp; editing. RT: Conceptualization, Methodology, Investigation, Writing &#x2013; original draft, Writing &#x2013; review &amp; editing. PE: Conceptualization, Investigation, Writing &#x2013; original draft, Writing &#x2013; review &amp; editing. I-TC: Conceptualization, Methodology, Investigation, Writing &#x2013; original draft, Writing &#x2013; review &amp; editing. CG: Resources, Data curation, Software, Writing &#x2013; review &amp; editing. JL: Resources, Data curation, Software, Writing &#x2013; review &amp; editing. LP: Resources, Data curation, Software, Writing &#x2013; review &amp; editing. MR: Validation, Writing &#x2013; review &amp; editing. RE: Validation, Writing &#x2013; review &amp; editing. HT: Validation, Writing &#x2013; review &amp; editing. WZ: Project administration, Supervision, Writing &#x2013; review &amp; editing. JG: Conceptualization, Methodology, Writing &#x2013; review &amp; editing, Supervision. HR: Conceptualization, Funding acquisition, Resources, Supervision, Writing &#x2013; review &amp; editing. JC: Conceptualization, Resources, Supervision, Writing &#x2013; original draft, Writing &#x2013; review &amp; editing.</p>
</sec>
<sec id="s8" sec-type="funding-information">
<title>Funding</title>
<p>The author(s) declare that no financial support was received for the research and/or publication of this article.</p>
</sec>
<ack>
<title>Acknowledgments</title>
<p>We are grateful to Jonathan Duke-Cohan for his careful and engaged editorial oversight of the manuscript. We thank Mary Carrington for discussion and helpful feedback which improved the manuscript and Thomas Snyder for guidance during early stages of manuscript drafting. We also thank the reviewers who provided helpful feedback that improved the clarity of the manuscript.</p>
</ack>
<sec id="s9" sec-type="memoriam">
<title>In memoriam</title>
<p>This paper is dedicated to the memory of Peter Jacob Robert Ebert (1978 &#x2013; 2023). He marched to his own drumbeat and was unconcerned with popular opinions. His intellectual curiosity, independence and rigor made him an innovative scientific leader and a wonderful collaborator. He was not only an incredibly clever scientist, but also a funny and kind colleague who will be missed by all who had the privilege to know him.</p>
</sec>
<sec id="s10" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>HZ, CG, JL, LP, JG, JC were employed by Microsoft. RT, PE, I-TC, MR, RE, WZ, HR were employed by Adaptive Biotechnologies.</p>
<p>The remaining authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s11" sec-type="ai-statement">
<title>Generative AI statement</title>
<p>The author(s) declare that no Generative AI was used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p>
</sec>
<sec id="s12" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s13" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fimmu.2025.1603730/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fimmu.2025.1603730/full#supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="Presentation1.pdf" id="SF1" mimetype="application/pdf">
<label>Supplementary Figure&#xa0;1</label>
<caption>
<p>Demographic distribution of sample population. <bold>(A)</bold> Age, <bold>(B)</bold> sex and <bold>(C)</bold> self-reported ethnicity distribution of sample subjects.</p>
</caption>
</supplementary-material>
<supplementary-material xlink:href="Presentation1.pdf" id="SF2" mimetype="application/pdf">
<label>Supplementary Figure&#xa0;2</label>
<caption>
<p>Effectiveness of L1LR method to resolve LD. Heatmap showing the amount of TCR<italic>&#x3b2;</italic> sharing before (left) and after (right) applying L1LR method to resolve LD. The color indicates the fractional sharing of TCR<italic>&#x3b2;</italic>s amongst pairs of HLAs relative to the total number of TCR<italic>&#x3b2;</italic>s associated with the HLA indicated on the vertical axis. After accounting for LD, we observe significantly less sharing of TCR<italic>&#x3b2;</italic>s amongst HLA allotypes. The remaining shared TCR<italic>&#x3b2;</italic>s may be the result of LD that is too strong to resolve using our method or true sharing of TCR<italic>&#x3b2;</italic>s between multiple HLAs (e.g., as shown in the main text).</p>
</caption>
</supplementary-material>
<supplementary-material xlink:href="Presentation1.pdf" id="SF3" mimetype="application/pdf">
<label>Supplementary Figure&#xa0;3</label>
<caption>
<p>HLA-A models. Left column shows the precision-recall curve for the trained model evaluated on the train sample (middle left), train sample in cross-validation (middle right) and on the holdout sample (right) for HLA-A. The green line indicates the calibration threshold.</p>
</caption>
</supplementary-material>
<supplementary-material xlink:href="Presentation1.pdf" id="SF4" mimetype="application/pdf">
<label>Supplementary Figure&#xa0;4</label>
<caption>
<p>HLA-B models. Left column shows the precision-recall curve for the trained model evaluated on the train sample (middle left), train sample in cross-validation (middle right) and on the holdout sample (right) for HLA-B. The green line indicates the calibration threshold.</p>
</caption>
</supplementary-material>
<supplementary-material xlink:href="Presentation1.pdf" id="SF5" mimetype="application/pdf">
<label>Supplementary Figure&#xa0;5</label>
<caption>
<p>HLA-C models. Left column shows the precision-recall curve for the trained model evaluated on the train sample (middle left), train sample in cross-validation (middle right) and on the holdout sample (right) for HLA-C. The green line indicates the calibration threshold.</p>
</caption>
</supplementary-material>
<supplementary-material xlink:href="Presentation1.pdf" id="SF6" mimetype="application/pdf">
<label>Supplementary Figure&#xa0;6</label>
<caption>
<p>HLA-DP models. Left column shows the precision-recall curve for the trained model evaluated on the train sample (middle left), train sample in cross-validation (middle right) and on the holdout sample (right) for HLA-DP. The green line indicates the calibration threshold.</p>
</caption>
</supplementary-material>
<supplementary-material xlink:href="Presentation1.pdf" id="SF7" mimetype="application/pdf">
<label>Supplementary Figure&#xa0;7</label>
<caption>
<p>HLA-DQ models. Left column shows the precision-recall curve for the trained model evaluated on the train sample (middle left), train sample in cross-validation (middle right) and on the holdout sample (right) for HLA-DQ. The green line indicates the calibration threshold.</p>
</caption>
</supplementary-material>
<supplementary-material xlink:href="Presentation1.pdf" id="SF8" mimetype="application/pdf">
<label>Supplementary Figure&#xa0;8</label>
<caption>
<p>HLA-DR models. Left column shows the precision-recall curve for the trained model evaluated on the train sample (middle left), train sample in cross-validation (middle right) and on the holdout sample (right) for HLA-DR. The green line indicates the calibration threshold.</p>
</caption>
</supplementary-material>
<supplementary-material xlink:href="Presentation1.pdf" id="SF9" mimetype="application/pdf">
<label>Supplementary Figure&#xa0;9</label>
<caption>
<p>TCRs specificity apparently independent of synonymous mutations in coding regions of HLAs. Number of TCR<italic>&#x3b2;</italic>s overlapping in two ES sets of HLAs differing only in their third field designation as a function of the FET p-value threshold used to identify ESs. The solid line shows the overlap in two sets of ESs identified using the three field designation to divide samples into two groups. Error bars are poisson uncertainties. Even if the TCR specificity is identical for HLAs differing only in their third field designation, we expect differences in the ES sets due to statistical fluctuations resulting from sampling. To account for this effect, we compare the observed overlap fraction when segregating samples by third field designation to a null distribution of overlap fractions derived from 100 realizations of two samples which are randomly divided irrespective of the third field designation. The two randomly divided samples in each realization are selected such that the relative size of the two samples matches the size of two samples split by the three field designation. Shaded regions indicate the distribution of the overlap fraction from these 100 realizations. Consistency between the overlap fraction of ESs derived from samples differing in their three field resolution and ones based on random permutation demonstrates that TCR specificity is independent of three field resolution for the two HLA allotypes tested.</p>
</caption>
</supplementary-material>
<supplementary-material xlink:href="Presentation1.pdf" id="SF10" mimetype="application/pdf">
<label>Supplementary Figure&#xa0;10</label>
<caption>
<p>We test the hypothesis that homozygosity at one loci increases breadth at another class matched loci. The distribution of zscores across class matched loci from a pairwise loci comparison. We calculate the zscore of the breadth at one loci in the case where another class matched loci is heterozygous or homozygous. We aggregate all pairwise comparisons for class I and class II separately.</p>
</caption>
</supplementary-material>
</sec>
<fn-group>
<fn id="fn1">
<label>1</label>
<p>
<ext-link ext-link-type="uri" xlink:href="http://hla.alleles.org/alleles/p_groups.html">http://hla.alleles.org/alleles/p_groups.html</ext-link>.</p>
</fn>
<fn id="fn2">
<label>2</label>
<p>Degenerate subunit pairs are indicatedby one of the degenerate subunits shown in parenthesis.</p>
</fn>
<fn id="fn3">
<label>3</label>
<p>F1 score is the harmonic mean of precision and recall and a useful metric of classification accuracy when there is large class imbalance such as the one we have for HLA imputation.</p>
</fn>
<fn id="fn4">
<label>4</label>
<p>We note that HLA-DR heterodimers are not subject to such pairing because the <italic>&#x3b1;</italic> chain is nearly invariable and thus these heterodimers behave similarly to class I HLAs.</p>
</fn>
<fn id="fn5">
<label>5</label>
<p>These data do not have sequencing based HLA typing.</p>
</fn>
<fn id="fn6">
<label>6</label>
<p>Our group has explored such analyses in disease contexts and found consistent results using TCR<italic>&#x3b1;</italic> or TCR<italic>&#x3b2;</italic> repertoires.</p>
</fn>
</fn-group>
<ref-list>
<title>References</title>
<ref id="B1">
<label>1</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hughes</surname> <given-names>AL</given-names>
</name>
<name>
<surname>Yeager</surname> <given-names>M</given-names>
</name>
</person-group>. <article-title>Natural selection at major histocompatibility complex loci of vertebrates</article-title>. <source>Annu Rev Genet</source>. (<year>1998</year>) <volume>32</volume>:<page-range>415&#x2013;35</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1146/annurev.genet.32.1.415</pub-id>, PMID: <pub-id pub-id-type="pmid">9928486</pub-id></citation></ref>
<ref id="B2">
<label>2</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zinkernagel</surname> <given-names>RM</given-names>
</name>
<name>
<surname>Doherty</surname> <given-names>PC</given-names>
</name>
</person-group>. <article-title>Restriction of <italic>in vitro</italic> T cell-mediated cytotoxicity in lymphocytic choriomeningitis within a syngeneic or semiallogeneic system</article-title>. <source>Nature</source>. (<year>1974</year>) <volume>248</volume>:<page-range>701&#x2013;2</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/248701a0</pub-id>, PMID: <pub-id pub-id-type="pmid">4133807</pub-id></citation></ref>
<ref id="B3">
<label>3</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Davis</surname> <given-names>MM</given-names>
</name>
<name>
<surname>Boniface</surname> <given-names>JJ</given-names>
</name>
<name>
<surname>Reich</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Lyons</surname> <given-names>D</given-names>
</name>
<name>
<surname>Hampl</surname> <given-names>J</given-names>
</name>
<name>
<surname>Arden</surname> <given-names>B</given-names>
</name>
<etal/>
</person-group>. <article-title>Ligand recognition by (alpha)(beta) T cell receptors</article-title>. <source>Annu Rev Immunol</source>. (<year>1998</year>) <volume>16</volume>:<fpage>523</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1146/annurev.immunol.16.1.523</pub-id>, PMID: <pub-id pub-id-type="pmid">9597140</pub-id></citation></ref>
<ref id="B4">
<label>4</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Martin</surname> <given-names>MP</given-names>
</name>
<name>
<surname>Carrington</surname> <given-names>M</given-names>
</name>
</person-group>. <article-title>Immunogenetics of HIV disease</article-title>. <source>Immunol Rev</source>. (<year>2013</year>) <volume>254</volume>:<page-range>245&#x2013;64</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/imr.12071</pub-id>, PMID: <pub-id pub-id-type="pmid">23772624</pub-id></citation></ref>
<ref id="B5">
<label>5</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Schumacher</surname> <given-names>TN</given-names>
</name>
<name>
<surname>Schreiber</surname> <given-names>RD</given-names>
</name>
</person-group>. <article-title>Neoantigens in cancer immunotherapy</article-title>. <source>Science</source>. (<year>2015</year>) <volume>348</volume>:<fpage>69</fpage>&#x2013;<lpage>74</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1126/science.aaa4971</pub-id>, PMID: <pub-id pub-id-type="pmid">25838375</pub-id></citation></ref>
<ref id="B6">
<label>6</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Montgomery</surname> <given-names>RA</given-names>
</name>
<name>
<surname>Tatapudi</surname> <given-names>VS</given-names>
</name>
<name>
<surname>Leffell</surname> <given-names>MS</given-names>
</name>
<name>
<surname>Zachary</surname> <given-names>AA</given-names>
</name>
</person-group>. <article-title>HLA in transplantation</article-title>. <source>Nat Rev Nephrol</source>. (<year>2018</year>) <volume>14</volume>:<page-range>558&#x2013;70</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41581-018-0039-x</pub-id>, PMID: <pub-id pub-id-type="pmid">29985463</pub-id></citation></ref>
<ref id="B7">
<label>7</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Schumacher</surname> <given-names>TN</given-names>
</name>
<name>
<surname>Scheper</surname> <given-names>W</given-names>
</name>
<name>
<surname>Kvistborg</surname> <given-names>P</given-names>
</name>
</person-group>. <article-title>Cancer neoantigens</article-title>. <source>Annu Rev Immunol</source>. (<year>2019</year>) <volume>37</volume>:<fpage>173</fpage>&#x2013;<lpage>200</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1146/annurev-immunol-042617-053402</pub-id>, PMID: <pub-id pub-id-type="pmid">30550719</pub-id></citation></ref>
<ref id="B8">
<label>8</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kovacs</surname> <given-names>AA</given-names>
</name>
<name>
<surname>Kono</surname> <given-names>N</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>C-H</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>D</given-names>
</name>
<name>
<surname>Frederick</surname> <given-names>T</given-names>
</name>
<name>
<surname>Operskalski</surname> <given-names>E</given-names>
</name>
<etal/>
</person-group>. <article-title>Association of HLA genotype with T-cell activation in human immunodeficiency virus (HIV) and HIV/hepatitis C virus&#x2013;coinfected women</article-title>. <source>J Infect Dis</source>. (<year>2020</year>) <volume>221</volume>:<page-range>1156&#x2013;66</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/infdis/jiz589</pub-id>, PMID: <pub-id pub-id-type="pmid">31802115</pub-id></citation></ref>
<ref id="B9">
<label>9</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Francis</surname> <given-names>JM</given-names>
</name>
<name>
<surname>Leistritz-Edwards</surname> <given-names>D</given-names>
</name>
<name>
<surname>Dunn</surname> <given-names>A</given-names>
</name>
<name>
<surname>Tarr</surname> <given-names>C</given-names>
</name>
<name>
<surname>Lehman</surname> <given-names>J</given-names>
</name>
<name>
<surname>Dempsey</surname> <given-names>C</given-names>
</name>
<etal/>
</person-group>. <article-title>Allelic variation in class I HLA determines CD8+ T cell repertoire shape and cross-reactive memory responses to SARS-CoV-2</article-title>. <source>Sci Immunol</source>. (<year>2021</year>) <volume>7</volume>:<elocation-id>eabk3070</elocation-id>., PMID: <pub-id pub-id-type="pmid">34793243</pub-id></citation></ref>
<ref id="B10">
<label>10</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Olafsdottir</surname> <given-names>TA</given-names>
</name>
<name>
<surname>Bjarnadottir</surname> <given-names>K</given-names>
</name>
<name>
<surname>Norddahl</surname> <given-names>GL</given-names>
</name>
<name>
<surname>Halldorsson</surname> <given-names>GH</given-names>
</name>
<name>
<surname>Melsted</surname> <given-names>P</given-names>
</name>
<name>
<surname>Gunnarsdottir</surname> <given-names>K</given-names>
</name>
<etal/>
</person-group>. <article-title>HLA alleles, disease severity, and age associate with T-cell responses following infection with SARS-CoV-2</article-title>. <source>Commun Biol</source>. (<year>2022</year>) <volume>5</volume>:<fpage>914</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s42003-022-03893-w</pub-id>, PMID: <pub-id pub-id-type="pmid">36068292</pub-id></citation></ref>
<ref id="B11">
<label>11</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Robinson</surname> <given-names>J</given-names>
</name>
<name>
<surname>Halliwell</surname> <given-names>JA</given-names>
</name>
<name>
<surname>McWilliam</surname> <given-names>H</given-names>
</name>
<name>
<surname>Lopez</surname> <given-names>R</given-names>
</name>
<name>
<surname>Parham</surname> <given-names>P</given-names>
</name>
<name>
<surname>Marsh</surname> <given-names>SG</given-names>
</name>
</person-group>. <article-title>The imgt/hla database</article-title>. <source>Nucleic Acids Res</source>. (<year>2012</year>) <volume>41</volume>:<page-range>D1222&#x2013;7</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/gks949</pub-id>, PMID: <pub-id pub-id-type="pmid">23080122</pub-id></citation></ref>
<ref id="B12">
<label>12</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bjorkman</surname> <given-names>PJ</given-names>
</name>
<name>
<surname>Saper</surname> <given-names>M</given-names>
</name>
<name>
<surname>Samraoui</surname> <given-names>B</given-names>
</name>
<name>
<surname>Bennett</surname> <given-names>WS</given-names>
</name>
<name>
<surname>Strominger</surname> <given-names>Jt</given-names>
</name>
<name>
<surname>Wiley</surname> <given-names>D</given-names>
</name>
</person-group>. <article-title>Structure of the human class I histocompatibility antigen, HLA-A2</article-title>. <source>Nature</source>. (<year>1987</year>) <volume>329</volume>:<page-range>506&#x2013;12</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/329506a0</pub-id>, PMID: <pub-id pub-id-type="pmid">3309677</pub-id></citation></ref>
<ref id="B13">
<label>13</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fremont</surname> <given-names>DH</given-names>
</name>
<name>
<surname>Matsumura</surname> <given-names>M</given-names>
</name>
<name>
<surname>Stura</surname> <given-names>EA</given-names>
</name>
<name>
<surname>Peterson</surname> <given-names>PA</given-names>
</name>
<name>
<surname>Wilson</surname> <given-names>lA</given-names>
</name>
</person-group>. <article-title>Crystal structures of two viral peptides in complex with murine MHC class I H-2Kb</article-title>. <source>Science</source>. (<year>1992</year>) <volume>257</volume>:<page-range>919&#x2013;27</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1126/science.1323877</pub-id>, PMID: <pub-id pub-id-type="pmid">1323877</pub-id></citation></ref>
<ref id="B14">
<label>14</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Babbitt</surname> <given-names>BP</given-names>
</name>
<name>
<surname>Allen</surname> <given-names>PM</given-names>
</name>
<name>
<surname>Matsueda</surname> <given-names>G</given-names>
</name>
<name>
<surname>Haber</surname> <given-names>E</given-names>
</name>
<name>
<surname>Unanue</surname> <given-names>ER</given-names>
</name>
</person-group>. <article-title>Binding of immunogenic peptides to Ia histocompatibility molecules</article-title>. <source>Nature</source>. (<year>1985</year>) <volume>317</volume>:<page-range>359&#x2013;61</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/317359a0</pub-id>, PMID: <pub-id pub-id-type="pmid">3876513</pub-id></citation></ref>
<ref id="B15">
<label>15</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Brown</surname> <given-names>JH</given-names>
</name>
<name>
<surname>Jardetzky</surname> <given-names>TS</given-names>
</name>
<name>
<surname>Gorga</surname> <given-names>JC</given-names>
</name>
<name>
<surname>Stern</surname> <given-names>LJ</given-names>
</name>
<name>
<surname>Urban</surname> <given-names>RG</given-names>
</name>
<name>
<surname>Strominger</surname> <given-names>JL</given-names>
</name>
<etal/>
</person-group>. <article-title>Three-dimensional structure of the human class II histocompatibility antigen HLA-DR1</article-title>. <source>Nature</source>. (<year>1993</year>) <volume>364</volume>:<page-range>33&#x2013;9</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/364033a0</pub-id>, PMID: <pub-id pub-id-type="pmid">8316295</pub-id></citation></ref>
<ref id="B16">
<label>16</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fremont</surname> <given-names>DH</given-names>
</name>
<name>
<surname>Hendrickson</surname> <given-names>WA</given-names>
</name>
<name>
<surname>Marrack</surname> <given-names>P</given-names>
</name>
<name>
<surname>Kappler</surname> <given-names>J</given-names>
</name>
</person-group>. <article-title>Structures of an MHC class II molecule with covalently bound single peptides</article-title>. <source>Science</source>. (<year>1996</year>) <volume>272</volume>:<page-range>1001&#x2013;4</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1126/science.272.5264.1001</pub-id>, PMID: <pub-id pub-id-type="pmid">8638119</pub-id></citation></ref>
<ref id="B17">
<label>17</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Marsh</surname> <given-names>SGE</given-names>
</name>
<name>
<surname>Albert</surname> <given-names>ED</given-names>
</name>
<name>
<surname>Bodmer</surname> <given-names>WF</given-names>
</name>
<name>
<surname>Bontrop</surname> <given-names>RE</given-names>
</name>
<name>
<surname>Dupont</surname> <given-names>B</given-names>
</name>
<name>
<surname>Erlich</surname> <given-names>HA</given-names>
</name>
<etal/>
</person-group>. <article-title>An update to HLA nomenclature, 2010</article-title>. <source>Bone Marrow Transplant</source>. (<year>2010</year>) <volume>45</volume>:<page-range>846&#x2013;8</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/bmt.2010.79</pub-id>, PMID: <pub-id pub-id-type="pmid">20348972</pub-id></citation></ref>
<ref id="B18">
<label>18</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sidney</surname> <given-names>J</given-names>
</name>
<name>
<surname>Peters</surname> <given-names>B</given-names>
</name>
<name>
<surname>Frahm</surname> <given-names>N</given-names>
</name>
<name>
<surname>Brander</surname> <given-names>C</given-names>
</name>
<name>
<surname>Sette</surname> <given-names>A</given-names>
</name>
</person-group>. <article-title>HLA class I supertypes: a revised and updated classification</article-title>. <source>BMC Immunol</source>. (<year>2008</year>) <volume>9</volume>:<fpage>1</fpage>&#x2013;<lpage>15</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/1471-2172-9-1</pub-id>, PMID: <pub-id pub-id-type="pmid">18211710</pub-id></citation></ref>
<ref id="B19">
<label>19</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Apps</surname> <given-names>R</given-names>
</name>
<name>
<surname>Qi</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Carlson</surname> <given-names>JM</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>H</given-names>
</name>
<name>
<surname>Gao</surname> <given-names>X</given-names>
</name>
<name>
<surname>Thomas</surname> <given-names>R</given-names>
</name>
<etal/>
</person-group>. <article-title>Influence of HLA-C expression level on HIV control</article-title>. <source>Science</source>. (<year>2013</year>) <volume>340</volume>:<fpage>87</fpage>&#x2013;<lpage>91</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1126/science.1232685</pub-id>, PMID: <pub-id pub-id-type="pmid">23559252</pub-id></citation></ref>
<ref id="B20">
<label>20</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ramsuran</surname> <given-names>V</given-names>
</name>
<name>
<surname>Naranbhai</surname> <given-names>V</given-names>
</name>
<name>
<surname>Horowitz</surname> <given-names>A</given-names>
</name>
<name>
<surname>Qi</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Martin</surname> <given-names>MP</given-names>
</name>
<name>
<surname>Yuki</surname> <given-names>Y</given-names>
</name>
<etal/>
</person-group>. <article-title>Elevated HLA-A expression impairs HIV control through inhibition of NKG2A-expressing cells</article-title>. <source>Science</source>. (<year>2018</year>) <volume>359</volume>:<fpage>86</fpage>&#x2013;<lpage>90</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1126/science.aam8825</pub-id>, PMID: <pub-id pub-id-type="pmid">29302013</pub-id></citation></ref>
<ref id="B21">
<label>21</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Martin</surname> <given-names>MP</given-names>
</name>
<name>
<surname>Gao</surname> <given-names>X</given-names>
</name>
<name>
<surname>Lee</surname> <given-names>J-H</given-names>
</name>
<name>
<surname>Nelson</surname> <given-names>GW</given-names>
</name>
<name>
<surname>Detels</surname> <given-names>R</given-names>
</name>
<name>
<surname>Goedert</surname> <given-names>JJ</given-names>
</name>
<etal/>
</person-group>. <article-title>Epistatic interaction between KIR3DS1 and HLA-B delays the progression to AIDS</article-title>. <source>Nat Genet</source>. (<year>2002</year>) <volume>31</volume>:<page-range>429&#x2013;34</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/ng934</pub-id>, PMID: <pub-id pub-id-type="pmid">12134147</pub-id></citation></ref>
<ref id="B22">
<label>22</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kloverpris</surname> <given-names>HN</given-names>
</name>
<name>
<surname>Cole</surname> <given-names>DK</given-names>
</name>
<name>
<surname>Fuller</surname> <given-names>A</given-names>
</name>
<name>
<surname>Carlson</surname> <given-names>J</given-names>
</name>
<name>
<surname>Beck</surname> <given-names>K</given-names>
</name>
<name>
<surname>Schauenburg</surname> <given-names>AJ</given-names>
</name>
<etal/>
</person-group>. <article-title>A molecular switch in immunodominant HIV-1-specific CD8 T-cell epitopes shapes differential HLA-restricted escape</article-title>. <source>Retrovirology</source>. (<year>2015</year>) <volume>12</volume>:<fpage>1</fpage>&#x2013;<lpage>11</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12977-015-0149-5</pub-id>, PMID: <pub-id pub-id-type="pmid">25808313</pub-id></citation></ref>
<ref id="B23">
<label>23</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Illing</surname> <given-names>PT</given-names>
</name>
<name>
<surname>Pymm</surname> <given-names>P</given-names>
</name>
<name>
<surname>Croft</surname> <given-names>NP</given-names>
</name>
<name>
<surname>Hilton</surname> <given-names>HG</given-names>
</name>
<name>
<surname>Jojic</surname> <given-names>V</given-names>
</name>
<name>
<surname>Han</surname> <given-names>AS</given-names>
</name>
<etal/>
</person-group>. <article-title>HLA-B57 micropolymorphism defines the sequence and conformational breadth of the immunopeptidome</article-title>. <source>Nat Commun</source>. (<year>2018</year>) <volume>9</volume>:<fpage>4693</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41467-018-07109-w</pub-id>, PMID: <pub-id pub-id-type="pmid">30410026</pub-id></citation></ref>
<ref id="B24">
<label>24</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Carlson</surname> <given-names>JM</given-names>
</name>
<name>
<surname>Listgarten</surname> <given-names>J</given-names>
</name>
<name>
<surname>Pfeifer</surname> <given-names>N</given-names>
</name>
<name>
<surname>Tan</surname> <given-names>V</given-names>
</name>
<name>
<surname>Kadie</surname> <given-names>C</given-names>
</name>
<name>
<surname>Walker</surname> <given-names>BD</given-names>
</name>
<etal/>
</person-group>. <article-title>Widespread impact of HLA restriction on immune control and escape pathways of HIV-1</article-title>. <source>J Virol</source>. (<year>2012</year>) <volume>86</volume>:<page-range>5230&#x2013;43</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1128/JVI.06728-11</pub-id>, PMID: <pub-id pub-id-type="pmid">22379086</pub-id></citation></ref>
<ref id="B25">
<label>25</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hedrick</surname> <given-names>SM</given-names>
</name>
<name>
<surname>Cohen</surname> <given-names>DI</given-names>
</name>
<name>
<surname>Nielsen</surname> <given-names>EA</given-names>
</name>
<name>
<surname>Davis</surname> <given-names>MM</given-names>
</name>
</person-group>. <article-title>Isolation of Cdna clones encoding T cell-specific membrane-associated proteins</article-title>. <source>Nature</source>. (<year>1984</year>) <volume>308</volume>:<page-range>149&#x2013;53</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/308149a0</pub-id>, PMID: <pub-id pub-id-type="pmid">6199676</pub-id></citation></ref>
<ref id="B26">
<label>26</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yanagi</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Yoshikai</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Leggett</surname> <given-names>K</given-names>
</name>
<name>
<surname>Clark</surname> <given-names>SP</given-names>
</name>
<name>
<surname>Aleksander</surname> <given-names>I</given-names>
</name>
<name>
<surname>Mak</surname> <given-names>TW</given-names>
</name>
</person-group>. <article-title>A human T cell-specific cDNA clone encodes a protein having extensive homology to immunoglobulin chains</article-title>. <source>Nature</source>. (<year>1984</year>) <volume>308</volume>:<page-range>145&#x2013;9</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/308145a0</pub-id>, PMID: <pub-id pub-id-type="pmid">6336315</pub-id></citation></ref>
<ref id="B27">
<label>27</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fink</surname> <given-names>PJ</given-names>
</name>
<name>
<surname>Bevan</surname> <given-names>MJ</given-names>
</name>
</person-group>. <article-title>H-2 antigens of the thymus determinelymphocyte specificity</article-title>. <source>J Exp Med</source>. (<year>1978</year>) <volume>148</volume>:<page-range>766&#x2013;75</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1084/jem.148.3.766</pub-id>, PMID: <pub-id pub-id-type="pmid">308986</pub-id></citation></ref>
<ref id="B28">
<label>28</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zinkernagel</surname> <given-names>RM</given-names>
</name>
<name>
<surname>Callahan</surname> <given-names>GN</given-names>
</name>
<name>
<surname>Klein</surname> <given-names>J</given-names>
</name>
<name>
<surname>Dennert</surname> <given-names>G</given-names>
</name>
</person-group>. <article-title>Cytotoxic T cells learn specificity for self H&#x2013;2 during differentiation in the thymus</article-title>. <source>Nature</source>. (<year>1978</year>) <volume>271</volume>:<page-range>251&#x2013;3</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/271251a0</pub-id>, PMID: <pub-id pub-id-type="pmid">304527</pub-id></citation></ref>
<ref id="B29">
<label>29</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Philpott</surname> <given-names>KL</given-names>
</name>
<name>
<surname>Viney</surname> <given-names>JL</given-names>
</name>
<name>
<surname>Kay</surname> <given-names>G</given-names>
</name>
<name>
<surname>Rastan</surname> <given-names>S</given-names>
</name>
<name>
<surname>Gardiner</surname> <given-names>EM</given-names>
</name>
<name>
<surname>Chae</surname> <given-names>S</given-names>
</name>
<etal/>
</person-group>. <article-title>Lymphoid development in mice congenitally lacking T cell receptor &#x3b1;&#x3b2;-expressing cells</article-title>. <source>Science</source>. (<year>1992</year>) <volume>256</volume>:<page-range>1448&#x2013;52</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1126/science.1604321</pub-id>, PMID: <pub-id pub-id-type="pmid">1604321</pub-id></citation></ref>
<ref id="B30">
<label>30</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Huseby</surname> <given-names>ES</given-names>
</name>
<name>
<surname>White</surname> <given-names>J</given-names>
</name>
<name>
<surname>Crawford</surname> <given-names>F</given-names>
</name>
<name>
<surname>Vass</surname> <given-names>T</given-names>
</name>
<name>
<surname>Becker</surname> <given-names>D</given-names>
</name>
<name>
<surname>Pinilla</surname> <given-names>C</given-names>
</name>
<etal/>
</person-group>. <article-title>How the T cell repertoire becomes peptide and MHC specific</article-title>. <source>Cell</source>. (<year>2005</year>) <volume>122</volume>:<page-range>247&#x2013;60</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.cell.2005.05.013</pub-id>, PMID: <pub-id pub-id-type="pmid">16051149</pub-id></citation></ref>
<ref id="B31">
<label>31</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kisielow</surname> <given-names>P</given-names>
</name>
<name>
<surname>Teh</surname> <given-names>HS</given-names>
</name>
<name>
<surname>Bl&#xa8;uthmann</surname> <given-names>H</given-names>
</name>
<name>
<surname>von Boehmer</surname> <given-names>H</given-names>
</name>
</person-group>. <article-title>Positive selection of antigen-specific T cells in thymus by restricting MHC molecules</article-title>. <source>Nature</source>. (<year>1988</year>) <volume>335</volume>:<page-range>730&#x2013;3</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/335730a0</pub-id>, PMID: <pub-id pub-id-type="pmid">3262831</pub-id></citation></ref>
<ref id="B32">
<label>32</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>von Boehmer</surname> <given-names>H</given-names>
</name>
<name>
<surname>Kisielow</surname> <given-names>P</given-names>
</name>
<name>
<surname>Kishi</surname> <given-names>H</given-names>
</name>
<name>
<surname>Scott</surname> <given-names>B</given-names>
</name>
<name>
<surname>Borgulya</surname> <given-names>P</given-names>
</name>
<name>
<surname>Teh</surname> <given-names>HS</given-names>
</name>
</person-group>. <article-title>The expression of CD4 and CD8 accessory molecules on mature T cells is not random but correlates with the specificity of the &#x3b1;&#x3b2; receptor for antigen</article-title>. <source>Immunol Rev</source>. (<year>1989</year>) <volume>109</volume>:<page-range>143&#x2013;52</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/j.1600-065X.1989.tb00023.x</pub-id>, PMID: <pub-id pub-id-type="pmid">2475425</pub-id></citation></ref>
<ref id="B33">
<label>33</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kaye</surname> <given-names>J</given-names>
</name>
<name>
<surname>Hsu</surname> <given-names>M-L</given-names>
</name>
<name>
<surname>Sauron</surname> <given-names>M-E</given-names>
</name>
<name>
<surname>Jameson</surname> <given-names>SC</given-names>
</name>
<name>
<surname>Gascoigne</surname> <given-names>NR</given-names>
</name>
<name>
<surname>Hedrick</surname> <given-names>SM</given-names>
</name>
</person-group>. <article-title>Selective development of CD4+ T cells in transgenic mice expressing a class II MHC-restricted antigen receptor</article-title>. <source>Nature</source>. (<year>1989</year>) <volume>341</volume>:<page-range>746&#x2013;9</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/341746a0</pub-id>, PMID: <pub-id pub-id-type="pmid">2571940</pub-id></citation></ref>
<ref id="B34">
<label>34</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Burnet</surname> <given-names>FM</given-names>
</name>
</person-group>. <article-title>A modification of jerne&#x2019;s theory of antibody production using the concept of clonal selection</article-title>. <source>CA: A Cancer J Clin</source>. (<year>1976</year>) <volume>26</volume>:<page-range>119&#x2013;21</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.3322/canjclin.26.2.119</pub-id>, PMID: <pub-id pub-id-type="pmid">816431</pub-id></citation></ref>
<ref id="B35">
<label>35</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Emerson</surname> <given-names>RO</given-names>
</name>
<name>
<surname>DeWitt</surname> <given-names>WS</given-names>
</name>
<name>
<surname>Vignali</surname> <given-names>M</given-names>
</name>
<name>
<surname>Gravley</surname> <given-names>J</given-names>
</name>
<name>
<surname>Hu</surname> <given-names>JK</given-names>
</name>
<name>
<surname>Osborne</surname> <given-names>EJ</given-names>
</name>
<etal/>
</person-group>. <article-title>Immunosequencing identifies signatures of cytomegalovirus exposure history and HLA-mediated effects on the T cell repertoire</article-title>. <source>Nat Genet</source>. (<year>2017</year>) <volume>49</volume>:<page-range>659&#x2013;65</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/ng.3822</pub-id>, PMID: <pub-id pub-id-type="pmid">28369038</pub-id></citation></ref>
<ref id="B36">
<label>36</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>DeWitt</surname> <given-names>WS</given-names>
<suffix>III</suffix>
</name>
<name>
<surname>Smith</surname> <given-names>A</given-names>
</name>
<name>
<surname>Schoch</surname> <given-names>G</given-names>
</name>
<name>
<surname>Hansen</surname> <given-names>JA</given-names>
</name>
<name>
<surname>Matsen</surname> <given-names>FA</given-names>
<suffix>IV</suffix>
</name>
<name>
<surname>Bradley</surname> <given-names>P</given-names>
</name>
</person-group>. <article-title>Human T cell receptor occurrence patterns encode immune history, genetic background, and receptor specificity</article-title>. <source>Elife</source>. (<year>2018</year>) <volume>7</volume>:<fpage>e38358</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.7554/eLife.38358.043</pub-id>, PMID: <pub-id pub-id-type="pmid">30152754</pub-id></citation></ref>
<ref id="B37">
<label>37</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Snyder</surname> <given-names>TM</given-names>
</name>
<name>
<surname>Gittelman</surname> <given-names>RM</given-names>
</name>
<name>
<surname>Klinger</surname> <given-names>M</given-names>
</name>
<name>
<surname>May</surname> <given-names>DH</given-names>
</name>
<name>
<surname>Osborne</surname> <given-names>EJ</given-names>
</name>
<name>
<surname>Taniguchi</surname> <given-names>R</given-names>
</name>
<etal/>
</person-group>. <article-title>Magnitude and dynamics of the T-cell response to SARS-CoV-2 infection at both individual and population levels</article-title>. <source>MedRxiv</source>. (<year>2020</year>). doi:&#xa0;<pub-id pub-id-type="doi">10.1101/2020.07.31.20165647</pub-id>, PMID: <pub-id pub-id-type="pmid">32793919</pub-id></citation></ref>
<ref id="B38">
<label>38</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Greissl</surname> <given-names>J</given-names>
</name>
<name>
<surname>Pesesky</surname> <given-names>M</given-names>
</name>
<name>
<surname>Dalai</surname> <given-names>SC</given-names>
</name>
<name>
<surname>Rebman</surname> <given-names>AW</given-names>
</name>
<name>
<surname>Soloski</surname> <given-names>MJ</given-names>
</name>
<name>
<surname>Horn</surname> <given-names>EJ</given-names>
</name>
<etal/>
</person-group>. <article-title>Immunosequencing of the T-cell receptor repertoire reveals signatures specific for diagnosis and characterization of early Lyme disease</article-title>. <source>medRxiv</source>. (<year>2021</year>). doi:&#xa0;<pub-id pub-id-type="doi">10.1101/2021.07.30.21261353</pub-id>
</citation></ref>
<ref id="B39">
<label>39</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bradley</surname> <given-names>P</given-names>
</name>
<name>
<surname>Thomas</surname> <given-names>PG</given-names>
</name>
</person-group>. <article-title>Using T cell receptor repertoires to understand the principles of adaptive immune recognition</article-title>. <source>Annu Rev Immunol</source>. (<year>2019</year>) <volume>37</volume>:<page-range>547&#x2013;70</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1146/annurev-immunol-042718-041757</pub-id>, PMID: <pub-id pub-id-type="pmid">30699000</pub-id></citation></ref>
<ref id="B40">
<label>40</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cowell</surname> <given-names>LG</given-names>
</name>
</person-group>. <article-title>The diagnostic, prognostic, and therapeutic potential of adaptive immune receptor repertoire profiling in cancerAdaptive immune receptor repertoire profiling in cancer</article-title>. <source>Cancer Res</source>. (<year>2020</year>) <volume>80</volume>:<page-range>643&#x2013;54</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1158/0008-5472.CAN-19-1457</pub-id>, PMID: <pub-id pub-id-type="pmid">31888887</pub-id></citation></ref>
<ref id="B41">
<label>41</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Arstila</surname> <given-names>TP</given-names>
</name>
<name>
<surname>Casrouge</surname> <given-names>A</given-names>
</name>
<name>
<surname>Baron</surname> <given-names>V</given-names>
</name>
<name>
<surname>Even</surname> <given-names>J</given-names>
</name>
<name>
<surname>Kanellopoulos</surname> <given-names>J</given-names>
</name>
<name>
<surname>Kourilsky</surname> <given-names>P</given-names>
</name>
</person-group>. <article-title>A direct estimate of the human &#x3b1;&#x3b2; T cell receptor diversity</article-title>. <source>Science</source>. (<year>1999</year>) <volume>286</volume>:<page-range>958&#x2013;61</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1126/science.286.5441.958</pub-id>, PMID: <pub-id pub-id-type="pmid">10542151</pub-id></citation></ref>
<ref id="B42">
<label>42</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sewell</surname> <given-names>AK</given-names>
</name>
</person-group>. <article-title>Why must T cells be cross-reactive</article-title>? <source>Nat Rev Immunol</source>. (<year>2012</year>) <volume>12</volume>:<page-range>669&#x2013;77</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nri3279</pub-id>, PMID: <pub-id pub-id-type="pmid">22918468</pub-id></citation></ref>
<ref id="B43">
<label>43</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ruiz Ortega</surname> <given-names>M</given-names>
</name>
<name>
<surname>Pogorelyy</surname> <given-names>MV</given-names>
</name>
<name>
<surname>Minervina</surname> <given-names>AA</given-names>
</name>
<name>
<surname>Thomas</surname> <given-names>PG</given-names>
</name>
<name>
<surname>Mora</surname> <given-names>T</given-names>
</name>
<name>
<surname>Walczak</surname> <given-names>AM</given-names>
</name>
</person-group>. <article-title>Learning predictive signatures of HLA type from T-cell repertoires</article-title>. <source>PloS Comput Biol</source>. (<year>2025</year>) <volume>21</volume>:<fpage>e1012724</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1371/journal.pcbi.1012724</pub-id>, PMID: <pub-id pub-id-type="pmid">39761303</pub-id></citation></ref>
<ref id="B44">
<label>44</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>ElAbd</surname> <given-names>H</given-names>
</name>
<name>
<surname>Mahdy</surname> <given-names>AK</given-names>
</name>
<name>
<surname>Wacker</surname> <given-names>EM</given-names>
</name>
<name>
<surname>Gretsova</surname> <given-names>M</given-names>
</name>
<name>
<surname>Ellinghaus</surname> <given-names>D</given-names>
</name>
<name>
<surname>Franke</surname> <given-names>A</given-names>
</name>
</person-group>. <article-title>Decoding the restriction of T cell receptors to human leukocyte antigen alleles using statistical learning</article-title>. <source>bioRxiv</source>. (<year>2025</year>), <page-range>2025&#x2013;02</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1101/2025.02.06.636910</pub-id>
</citation></ref>
<ref id="B45">
<label>45</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Carlson</surname> <given-names>CS</given-names>
</name>
<name>
<surname>Emerson</surname> <given-names>RO</given-names>
</name>
<name>
<surname>Sherwood</surname> <given-names>AM</given-names>
</name>
<name>
<surname>Desmarais</surname> <given-names>C</given-names>
</name>
<name>
<surname>Chung</surname> <given-names>M-W</given-names>
</name>
<name>
<surname>Parsons</surname> <given-names>JM</given-names>
</name>
<etal/>
</person-group>. <article-title>Using synthetic templates to design an unbiased multiplex PCR assay</article-title>. <source>Nat&#xa0;Commun</source>. (<year>2013</year>) <volume>4</volume>:<fpage>1</fpage>&#x2013;<lpage>9</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/ncomms3680</pub-id>, PMID: <pub-id pub-id-type="pmid">24157944</pub-id></citation></ref>
<ref id="B46">
<label>46</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Robins</surname> <given-names>H</given-names>
</name>
</person-group>. <article-title>Immunosequencing: applications of immune repertoire deep sequencing</article-title>. <source>Curr Opin Immunol</source>. (<year>2013</year>) <volume>25</volume>:<page-range>646&#x2013;52</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.coi.2013.09.017</pub-id>, PMID: <pub-id pub-id-type="pmid">24140071</pub-id></citation></ref>
<ref id="B47">
<label>47</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Smith</surname> <given-names>AG</given-names>
</name>
<name>
<surname>Pereira</surname> <given-names>S</given-names>
</name>
<name>
<surname>Jaramillo</surname> <given-names>A</given-names>
</name>
<name>
<surname>Stoll</surname> <given-names>ST</given-names>
</name>
<name>
<surname>Khan</surname> <given-names>FM</given-names>
</name>
<name>
<surname>Berka</surname> <given-names>N</given-names>
</name>
<etal/>
</person-group>. <article-title>Comparison of sequence-specific oligonucleotide probe vs next generation sequencing for HLA-A, B, C, DRB1, DRB3/B4/B5, DQA1, DQB1, DPA1, and DPB1 typing: Toward single-pass high-resolution HLA typing in support of solid organ and hematopoietic cell transplant programs</article-title>. <source>Hla</source>. (<year>2019</year>) <volume>94</volume>:<fpage>296</fpage>&#x2013;<lpage>306</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/tan.13619</pub-id>, PMID: <pub-id pub-id-type="pmid">31237117</pub-id></citation></ref>
<ref id="B48">
<label>48</label>
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Lewontin</surname> <given-names>RC</given-names>
</name>
</person-group>. <source>The genetic basis of evolutionary change</source> Vol. <volume>560</volume>. . <publisher-loc>New York</publisher-loc>: <publisher-name>Columbia University Press</publisher-name> (<year>1974</year>).</citation></ref>
<ref id="B49">
<label>49</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zarnitsyna</surname> <given-names>VI</given-names>
</name>
<name>
<surname>Evavold</surname> <given-names>BD</given-names>
</name>
<name>
<surname>Schoettle</surname> <given-names>LN</given-names>
</name>
<name>
<surname>Blattman</surname> <given-names>JN</given-names>
</name>
<name>
<surname>Antia</surname> <given-names>R</given-names>
</name>
</person-group>. <article-title>Estimating the diversity, completeness, and cross-reactivity of the T cell repertoire</article-title>. <source>Front Immunol</source>. (<year>2013</year>) <volume>4</volume>:<elocation-id>485</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fimmu.2013.00485</pub-id>, PMID: <pub-id pub-id-type="pmid">24421780</pub-id></citation></ref>
<ref id="B50">
<label>50</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bentzen</surname> <given-names>AK</given-names>
</name>
<name>
<surname>Marquard</surname> <given-names>AM</given-names>
</name>
<name>
<surname>Lyngaa</surname> <given-names>R</given-names>
</name>
<name>
<surname>Saini</surname> <given-names>SK</given-names>
</name>
<name>
<surname>Ramskov</surname> <given-names>S</given-names>
</name>
<name>
<surname>Donia</surname> <given-names>M</given-names>
</name>
<etal/>
</person-group>.&#xa0;<article-title>Large-scale detection of antigen-specific T cells using peptide-MHC-I multimers labeled with DNA barcodes</article-title>. <source>Nat Biotechnol</source>. (<year>2016</year>) <volume>34</volume>:<page-range>1037&#x2013;45</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nbt.3662</pub-id>, PMID: <pub-id pub-id-type="pmid">27571370</pub-id></citation></ref>
<ref id="B51">
<label>51</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Glanville</surname> <given-names>J</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>H</given-names>
</name>
<name>
<surname>Nau</surname> <given-names>A</given-names>
</name>
<name>
<surname>Hatton</surname> <given-names>O</given-names>
</name>
<name>
<surname>Wagar</surname> <given-names>LE</given-names>
</name>
<name>
<surname>Rubelt</surname> <given-names>F</given-names>
</name>
<etal/>
</person-group>. <article-title>Identifying specificity groups in the T cell receptor repertoire</article-title>. <source>Nature</source>. (<year>2017</year>) <volume>547</volume>:<page-range>94&#x2013;8</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nature22976</pub-id>, PMID: <pub-id pub-id-type="pmid">28636589</pub-id></citation></ref>
<ref id="B52">
<label>52</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gittelman</surname> <given-names>RM</given-names>
</name>
<name>
<surname>Lavezzo</surname> <given-names>E</given-names>
</name>
<name>
<surname>Snyder</surname> <given-names>TM</given-names>
</name>
<name>
<surname>Zahid</surname> <given-names>HJ</given-names>
</name>
<name>
<surname>Carty</surname> <given-names>CL</given-names>
</name>
<name>
<surname>Elyanow</surname> <given-names>R</given-names>
</name>
<etal/>
</person-group>. <article-title>Longitudinal analysis of T cell receptor repertoires reveals shared patterns of antigen-specific response to SARS-CoV-2 infection</article-title>. <source>JCI Insight</source>. (<year>2022</year>) <volume>7</volume>(<issue>10</issue>), <fpage>p.e151849</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1172/jci.insight.151849</pub-id>, PMID: <pub-id pub-id-type="pmid">35439174</pub-id></citation></ref>
<ref id="B53">
<label>53</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Elyanow</surname> <given-names>R</given-names>
</name>
<name>
<surname>Snyder</surname> <given-names>TM</given-names>
</name>
<name>
<surname>Dalai</surname> <given-names>SC</given-names>
</name>
<name>
<surname>Gittelman</surname> <given-names>RM</given-names>
</name>
<name>
<surname>Boonyaratanakornkit</surname> <given-names>J</given-names>
</name>
<name>
<surname>Wald</surname> <given-names>A</given-names>
</name>
<etal/>
</person-group>. <article-title>T cell receptor sequencing identifies prior SARS-CoV-2 infection and correlates with neutralizing antibodies and disease severity</article-title>. <source>JCI Insight</source>. (<year>2022</year>) <volume>7</volume>(<issue>10</issue>), <fpage>p.e150070</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1172/jci.insight.150070</pub-id>, PMID: <pub-id pub-id-type="pmid">35439166</pub-id></citation></ref>
<ref id="B54">
<label>54</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Macdonald</surname> <given-names>WA</given-names>
</name>
<name>
<surname>Purcell</surname> <given-names>AW</given-names>
</name>
<name>
<surname>Mifsud</surname> <given-names>NA</given-names>
</name>
<name>
<surname>Ely</surname> <given-names>LK</given-names>
</name>
<name>
<surname>Williams</surname> <given-names>DS</given-names>
</name>
<name>
<surname>Chang</surname> <given-names>L</given-names>
</name>
<etal/>
</person-group>. <article-title>A naturally selected dimorphism within the HLA-B44 supertype alters class I structure, peptide repertoire, and T cell recognition</article-title>. <source>J Exp Med</source>. (<year>2003</year>) <volume>198</volume>:<page-range>679&#x2013;91</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1084/jem.20030066</pub-id>, PMID: <pub-id pub-id-type="pmid">12939341</pub-id></citation></ref>
<ref id="B55">
<label>55</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rossjohn</surname> <given-names>J</given-names>
</name>
<name>
<surname>Gras</surname> <given-names>S</given-names>
</name>
<name>
<surname>Miles</surname> <given-names>JJ</given-names>
</name>
<name>
<surname>Turner</surname> <given-names>SJ</given-names>
</name>
<name>
<surname>Godfrey</surname> <given-names>DI</given-names>
</name>
<name>
<surname>McCluskey</surname> <given-names>J</given-names>
</name>
</person-group>. <article-title>T cell antigen receptor recognition of antigen-presenting molecules</article-title>. <source>Annu Rev Immunol</source>. (<year>2015</year>) <volume>33</volume>:<fpage>169</fpage>&#x2013;<lpage>200</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1146/annurev-immunol-032414-112334</pub-id>, PMID: <pub-id pub-id-type="pmid">25493333</pub-id></citation></ref>
<ref id="B56">
<label>56</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Carrington</surname> <given-names>M</given-names>
</name>
<name>
<surname>Nelson</surname> <given-names>GW</given-names>
</name>
<name>
<surname>Martin</surname> <given-names>MP</given-names>
</name>
<name>
<surname>Kissner</surname> <given-names>T</given-names>
</name>
<name>
<surname>Vlahov</surname> <given-names>D</given-names>
</name>
<name>
<surname>Goedert</surname> <given-names>JJ</given-names>
</name>
<etal/>
</person-group>. <article-title>HLA and HIV-1: heterozygote advantage and B* 35-Cw* 04 disadvantage</article-title>. <source>Science</source>. (<year>1999</year>) <volume>283</volume>:<page-range>1748&#x2013;52</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1126/science.283.5408.1748</pub-id>, PMID: <pub-id pub-id-type="pmid">10073943</pub-id></citation></ref>
<ref id="B57">
<label>57</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chowell</surname> <given-names>D</given-names>
</name>
<name>
<surname>Morris</surname> <given-names>LGT</given-names>
</name>
<name>
<surname>Grigg</surname> <given-names>CM</given-names>
</name>
<name>
<surname>Weber</surname> <given-names>JK</given-names>
</name>
<name>
<surname>Samstein</surname> <given-names>RM</given-names>
</name>
<name>
<surname>Makarov</surname> <given-names>V</given-names>
</name>
<etal/>
</person-group>. <article-title>Patient HLA class I genotype influences cancer response to checkpoint blockade immunotherapy</article-title>. <source>Science</source>. (<year>2018</year>) <volume>359</volume>:<page-range>582&#x2013;7</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1126/science.aao4572</pub-id>, PMID: <pub-id pub-id-type="pmid">29217585</pub-id></citation></ref>
<ref id="B58">
<label>58</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Neefjes</surname> <given-names>JJ</given-names>
</name>
<name>
<surname>Ploegh</surname> <given-names>HL</given-names>
</name>
</person-group>. <article-title>Allele and locus-specific differences in cell surface expression and the association of HLA class I heavy chain with &#x3b2;2-microglobulin: differential effects of inhibition of glycosylation on class I subunit association</article-title>. <source>Eur J Immunol</source>. (<year>1988</year>) <volume>18</volume>:<page-range>801&#x2013;10</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/eji.1830180522</pub-id>, PMID: <pub-id pub-id-type="pmid">2967765</pub-id></citation></ref>
<ref id="B59">
<label>59</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Choo</surname> <given-names>SY</given-names>
</name>
</person-group>. <article-title>The HLA system: genetics, immunology, clinical testing, and clinical implications</article-title>. <source>Yonsei Med J</source>. (<year>2007</year>) <volume>48</volume>:<fpage>11</fpage>&#x2013;<lpage>23</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3349/ymj.2007.48.1.11</pub-id>, PMID: <pub-id pub-id-type="pmid">17326240</pub-id></citation></ref>
<ref id="B60">
<label>60</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Braunstein</surname> <given-names>NS</given-names>
</name>
<name>
<surname>Germain</surname> <given-names>RN</given-names>
</name>
</person-group>. <article-title>Allele-specific control of Ia molecule surface expression and conformation: implications for a general model of Ia structurefunction relationships</article-title>. <source>Proc Natl Acad Sci</source>. (<year>1987</year>) <volume>84</volume>:<page-range>2921&#x2013;5</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.84.9.2921</pub-id>, PMID: <pub-id pub-id-type="pmid">3033670</pub-id></citation></ref>
<ref id="B61">
<label>61</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kwok</surname> <given-names>WW</given-names>
</name>
<name>
<surname>Nepom</surname> <given-names>GT</given-names>
</name>
</person-group>. <article-title>Structural and functional constraints on HLA class&#xa0;II&#xa0;dimers implicated in susceptibility to insulin dependent diabetes mellitus</article-title>. <source>Bailliere&#x2019;s Clin Endocrinol Metab</source>. (<year>1991</year>) <volume>5</volume>:<page-range>375&#x2013;93</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/S0950-351X(05)80137-5</pub-id>, PMID: <pub-id pub-id-type="pmid">1716436</pub-id></citation></ref>
<ref id="B62">
<label>62</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tollefsen</surname> <given-names>S</given-names>
</name>
<name>
<surname>Hotta</surname> <given-names>K</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>X</given-names>
</name>
<name>
<surname>Simonsen</surname> <given-names>B</given-names>
</name>
<name>
<surname>Swaminathan</surname> <given-names>K</given-names>
</name>
<name>
<surname>Mathews</surname> <given-names>II</given-names>
</name>
<etal/>
</person-group>. <article-title>Structural and functional studies of trans-encoded HLA-DQ2. 3 (DQA1* 03: 01/DQB1* 02: 01) protein molecule</article-title>. <source>J Biol Chem</source>. (<year>2012</year>) <volume>287</volume>:<page-range>13611&#x2013;9</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1074/jbc.M111.320374</pub-id>, PMID: <pub-id pub-id-type="pmid">22362761</pub-id></citation></ref>
<ref id="B63">
<label>63</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Slatkin</surname> <given-names>M</given-names>
</name>
</person-group>. <article-title>Linkage disequilibrium&#x2014;understanding the evolutionary past&#xa0;and&#xa0;mapping the medical future</article-title>. <source>Nat Rev Genet</source>. (<year>2008</year>) <volume>9</volume>:<page-range>477&#x2013;85</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nrg2361</pub-id>, PMID: <pub-id pub-id-type="pmid">18427557</pub-id></citation></ref>
<ref id="B64">
<label>64</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Johnson</surname> <given-names>SA</given-names>
</name>
<name>
<surname>Seale</surname> <given-names>SL</given-names>
</name>
<name>
<surname>Gittelman</surname> <given-names>RM</given-names>
</name>
<name>
<surname>Rytlewski</surname> <given-names>JA</given-names>
</name>
<name>
<surname>Robins</surname> <given-names>HS</given-names>
</name>
<name>
<surname>Fields</surname> <given-names>PA</given-names>
</name>
</person-group>. <article-title>Impact of HLA type, age and chronic viral infection on peripheral T-cell receptor sharing between unrelated individuals</article-title>. <source>PloS One</source>. (<year>2021</year>) <volume>16</volume>:<fpage>e0249484</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1371/journal.pone.0249484</pub-id>, PMID: <pub-id pub-id-type="pmid">34460826</pub-id></citation></ref>
<ref id="B65">
<label>65</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wooldridge</surname> <given-names>L</given-names>
</name>
<name>
<surname>Ekeruche-Makinde</surname> <given-names>J</given-names>
</name>
<name>
<surname>van den Berg</surname> <given-names>HA</given-names>
</name>
<name>
<surname>Skowera</surname> <given-names>A</given-names>
</name>
<name>
<surname>Miles</surname> <given-names>JJ</given-names>
</name>
<name>
<surname>Tan</surname> <given-names>MP</given-names>
</name>
<etal/>
</person-group>. <article-title>A single autoimmune T cell receptor recognizes more than a million different peptides</article-title>. <source>J Biol Chem</source>. (<year>2012</year>) <volume>287</volume>:<page-range>1168&#x2013;77</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1074/jbc.M111.289488</pub-id>, PMID: <pub-id pub-id-type="pmid">22102287</pub-id></citation></ref>
<ref id="B66">
<label>66</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Robins</surname> <given-names>HS</given-names>
</name>
<name>
<surname>Campregher</surname> <given-names>PV</given-names>
</name>
<name>
<surname>Srivastava</surname> <given-names>SK</given-names>
</name>
<name>
<surname>Wacher</surname> <given-names>A</given-names>
</name>
<name>
<surname>Turtle</surname> <given-names>CJ</given-names>
</name>
<name>
<surname>Kahsai</surname> <given-names>O</given-names>
</name>
<etal/>
</person-group>. <article-title>Comprehensive assessment of T-cell receptor &#x3b2;-chain diversity in &#x3b1;&#x3b2; T cells</article-title>. <source>Blood</source>. (<year>2009</year>) <volume>114</volume>:<page-range>4099&#x2013;107</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1182/blood-2009-04-217604</pub-id>, PMID: <pub-id pub-id-type="pmid">19706884</pub-id></citation></ref>
<ref id="B67">
<label>67</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Qi</surname> <given-names>Q</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Cheng</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Glanville</surname> <given-names>J</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>D</given-names>
</name>
<name>
<surname>Lee</surname> <given-names>J-Y</given-names>
</name>
<etal/>
</person-group>. <article-title>Diversity and clonal selection in the human T-cell repertoire</article-title>. <source>Proc Natl Acad Sci</source>. (<year>2014</year>) <volume>111</volume>:<page-range>13139&#x2013;44</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.1409155111</pub-id>, PMID: <pub-id pub-id-type="pmid">25157137</pub-id></citation></ref>
<ref id="B68">
<label>68</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Murugan</surname> <given-names>A</given-names>
</name>
<name>
<surname>Mora</surname> <given-names>T</given-names>
</name>
<name>
<surname>Walczak</surname> <given-names>AM</given-names>
</name>
<name>
<surname>Callan</surname> <given-names>CG</given-names>
</name>
</person-group>. <article-title>Statistical inference of the generation probability of T-cell receptors from sequence repertoires</article-title>. <source>Proc Natl Acad Sci</source>. (<year>2012</year>) <volume>109</volume>:<page-range>16161&#x2013;6</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.1212755109</pub-id>, PMID: <pub-id pub-id-type="pmid">22988065</pub-id></citation></ref>
<ref id="B69">
<label>69</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yewdell</surname> <given-names>JW</given-names>
</name>
</person-group>. <article-title>Confronting complexity: real-world immunodominance in antiviral CD8+ T cell responses</article-title>. <source>Immunity</source>. (<year>2006</year>) <volume>25</volume>:<page-range>533&#x2013;43</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.immuni.2006.09.005</pub-id>, PMID: <pub-id pub-id-type="pmid">17046682</pub-id></citation></ref>
<ref id="B70">
<label>70</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>May</surname> <given-names>DH</given-names>
</name>
<name>
<surname>Woodhouse</surname> <given-names>S</given-names>
</name>
<name>
<surname>Zahid</surname> <given-names>HJ</given-names>
</name>
<name>
<surname>Elyanow</surname> <given-names>R</given-names>
</name>
<name>
<surname>Doroschak</surname> <given-names>K</given-names>
</name>
<name>
<surname>Noakes</surname> <given-names>MT</given-names>
</name>
<etal/>
</person-group>. <article-title>Identifying immune signatures of common exposures through co-occurrence of T-cell receptors in tens of thousands of donors</article-title>. <source>BioRxiv</source>. (<year>2024</year>), <page-range>2024&#x2013;03</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1101/2024.03.26.583354</pub-id>
</citation></ref>
<ref id="B71">
<label>71</label>
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Chapfuwa</surname> <given-names>P</given-names>
</name>
<name>
<surname>Demirel</surname> <given-names>I</given-names>
</name>
<name>
<surname>Pisani</surname> <given-names>L</given-names>
</name>
<name>
<surname>Zazo</surname> <given-names>J</given-names>
</name>
<name>
<surname>Portugaly</surname> <given-names>E</given-names>
</name>
<name>
<surname>Zahid</surname> <given-names>HJ</given-names>
</name>
<etal/>
</person-group>. , in: <conf-name>In The Thirteenth International Conference on Learning Representations</conf-name>, .</citation></ref>
<ref id="B72">
<label>72</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dines</surname> <given-names>JN</given-names>
</name>
<name>
<surname>Manley</surname> <given-names>TJ</given-names>
</name>
<name>
<surname>Svejnoha</surname> <given-names>E</given-names>
</name>
<name>
<surname>Simmons</surname> <given-names>HM</given-names>
</name>
<name>
<surname>Taniguchi</surname> <given-names>R</given-names>
</name>
<name>
<surname>Klinger</surname> <given-names>M</given-names>
</name>
<etal/>
</person-group>. <article-title>The immunerace study: A prospective multicohort study of immune response action to covid-19 events with the immunecode&#x2122; open access database</article-title>. <source>medRxiv</source>. (<year>2020</year>). doi:&#xa0;<pub-id pub-id-type="doi">10.1101/2020.08.17.20175158</pub-id>
</citation></ref>
<ref id="B73">
<label>73</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Su</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Yuan</surname> <given-names>D</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>DG</given-names>
</name>
<name>
<surname>Ng</surname> <given-names>RH</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>K</given-names>
</name>
<name>
<surname>Choi</surname> <given-names>J</given-names>
</name>
<etal/>
</person-group>. <article-title>Multiple early factors anticipate post-acute COVID-19 sequelae</article-title>. <source>Cell</source>. (<year>2022</year>) <volume>185</volume>:<page-range>881&#x2013;95</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.cell.2022.01.014</pub-id>, PMID: <pub-id pub-id-type="pmid">35216672</pub-id></citation></ref>
<ref id="B74">
<label>74</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fisher</surname> <given-names>RA</given-names>
</name>
</person-group>. <article-title>On the interpretation of &#x3c7; 2 from contingency tables, and the calculation of P</article-title>. <source>J R Stat Soc</source>. (<year>1922</year>) <volume>85</volume>:<fpage>87</fpage>&#x2013;<lpage>94</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.2307/2340521</pub-id>
</citation></ref>
<ref id="B75">
<label>75</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Surh</surname> <given-names>CD</given-names>
</name>
<name>
<surname>Sprent</surname> <given-names>J</given-names>
</name>
</person-group>. <article-title>Homeostasis of naive and memory T cells</article-title>. <source>Immunity</source>. (<year>2008</year>) <volume>29</volume>:<page-range>848&#x2013;62</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.immuni.2008.11.002</pub-id>, PMID: <pub-id pub-id-type="pmid">19100699</pub-id></citation></ref>
</ref-list>
</back>
</article>