<?xml version="1.0" encoding="UTF-8"?>
<?covid-19-tdm?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Immunol.</journal-id>
<journal-title>Frontiers in Immunology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Immunol.</abbrev-journal-title>
<issn pub-type="epub">1664-3224</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fimmu.2021.669357</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Immunology</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Influence of HLA Class II Polymorphism on Predicted Cellular Immunity Against SARS-CoV-2 at the Population and Individual Level</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Copley</surname>
<given-names>Hannah C.</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1235396"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Gragert</surname>
<given-names>Loren</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/698087"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Leach</surname>
<given-names>Andrew R.</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1401182"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Kosmoliaptsis</surname>
<given-names>Vasilis</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff5">
<sup>5</sup>
</xref>
<xref ref-type="aff" rid="aff6">
<sup>6</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/557897"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Department of Surgery, Addenbrooke&#x2019;s Hospital, University of Cambridge</institution>, <addr-line>Cambridge</addr-line>, <country>United Kingdom</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>European Bioinformatics Institute (EMBL-EBI)</institution>, <addr-line>Cambridge</addr-line>, <country>United Kingdom</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Department of Pathology, Tulane University School of Medicine</institution>, <addr-line>New Orleans, LA</addr-line>, <country>United States</country>
</aff>
<aff id="aff4">
<sup>4</sup>
<institution>Bioinformatics Research, National Marrow Donor Program</institution>, <addr-line>Minneapolis, MN</addr-line>, <country>United States</country>
</aff>
<aff id="aff5">
<sup>5</sup>
<institution>National Institute of Health Research (NIHR) Blood and Transplant Research Unit in Organ Donation and Transplantation, University of Cambridge</institution>, <addr-line>Cambridge</addr-line>, <country>United Kingdom</country>
</aff>
<aff id="aff6">
<sup>6</sup>
<institution>NIHR Cambridge Biomedical Research Centre</institution>, <addr-line>Cambridge</addr-line>, <country>United Kingdom</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>Edited by: Yongqun Oliver He, University of Michigan, United States</p>
</fn>
<fn fn-type="edited-by">
<p>Reviewed by: Arman Bashirova, Leidos Biomedical Research, Inc., United States; Jennifer Ann Juno, The University of Melbourne, Australia; Grigory Efimov, National Research Center for Hematology, Russia</p>
</fn>
<fn fn-type="corresp" id="fn001">
<p>*Correspondence: Vasilis Kosmoliaptsis, <email xlink:href="mailto:vk256@cam.ac.uk">vk256@cam.ac.uk</email>
</p>
</fn>
<fn fn-type="other" id="fn002">
<p>This article was submitted to Viral Immunology, a section of the journal Frontiers in Immunology</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>19</day>
<month>07</month>
<year>2021</year>
</pub-date>
<pub-date pub-type="collection">
<year>2021</year>
</pub-date>
<volume>12</volume>
<elocation-id>669357</elocation-id>
<history>
<date date-type="received">
<day>18</day>
<month>02</month>
<year>2021</year>
</date>
<date date-type="accepted">
<day>28</day>
<month>06</month>
<year>2021</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2021 Copley, Gragert, Leach and Kosmoliaptsis</copyright-statement>
<copyright-year>2021</copyright-year>
<copyright-holder>Copley, Gragert, Leach and Kosmoliaptsis</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>Development of adaptive immunity after COVID-19 and after vaccination against SARS-CoV-2 is predicated on recognition of viral peptides, presented on HLA class II molecules, by CD4+ T-cells. We capitalised on extensive high-resolution HLA data on twenty five human race/ethnic populations to investigate the role of HLA polymorphism on SARS-CoV-2 immunogenicity at the population and individual level. Within populations, we identify wide inter-individual variability in predicted peptide presentation from structural, non-structural and accessory SARS-CoV-2 proteins, according to individual HLA genotype. However, we find similar potential for anti-SARS-CoV-2 cellular immunity at the population level suggesting that HLA polymorphism is unlikely to account for observed disparities in clinical outcomes after COVID-19 among different race/ethnic groups. Our findings provide important insight on the potential role of HLA polymorphism on development of protective immunity after SARS-CoV-2 infection and after vaccination and a firm basis for further experimental studies in this field.</p>
</abstract>
<kwd-group>
<kwd>human leukocyte antigens</kwd>
<kwd>SARS-CoV-2</kwd>
<kwd>T-cells</kwd>
<kwd>cellular immunity</kwd>
<kwd>COVID-19</kwd>
</kwd-group>
<counts>
<fig-count count="4"/>
<table-count count="0"/>
<equation-count count="0"/>
<ref-count count="70"/>
<page-count count="13"/>
<word-count count="6652"/>
</counts>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<title>Introduction</title>
<p>The new severe acute respiratory syndrome coronavirus 2 (SARS-CoV-2), responsible for coronavirus disease 2019 (COVID-19), has caused an ongoing pandemic with 93,805,612 confirmed cases and 2,026,093 deaths worldwide [as of 19 January 2021 (<xref ref-type="bibr" rid="B1">1</xref>)]. Several risk factors for severe COVID-19 are now well-established, including age, gender, obesity and various co-morbidities such as diabetes, cancer and cardiovascular or chronic lung disease (<xref ref-type="bibr" rid="B2">2</xref>&#x2013;<xref ref-type="bibr" rid="B5">5</xref>). There is, however, an urgent need to better understand the role of race and ethnic differences on health outcomes. Several studies have highlighted a disproportionate prevalence of COVID-19 infections, higher rates of hospitalisation, and increased incidence of death in people from black and minority ethnic groups but the underlying reasons for these observations are not well understood (<xref ref-type="bibr" rid="B2">2</xref>, <xref ref-type="bibr" rid="B6">6</xref>&#x2013;<xref ref-type="bibr" rid="B8">8</xref>).</p>
<p>Even after accounting for well-known risk factors, there is still wide inter-individual clinical variability of COVID-19 outcomes within considered risk groups, which may reflect underlying genetic differences (<xref ref-type="bibr" rid="B9">9</xref>).The principal genetic region involved in immunity against viral pathogens is the Major Histocompatibility Complex encompassing the Human Leukocyte Antigen (HLA) loci. HLA class I (HLA-A, -B, -C) and HLA class II (HLA-DR, -DQ, -DP) proteins present viral peptides for recognition by CD8<sup>+</sup> and CD4<sup>+</sup> T-cells, respectively. The latter orchestrate adaptive anti-viral immunity and drive B-cell activation and maturation for robust humoral responses. Extensive polymorphism is observed in the HLA system, resulting in differences in HLA allele frequency both within and across human populations. HLA genotype can be a determining factor in development of protective immunity and, in turn, may account for part of the observed heterogeneity in measured immune responses and in clinical outcomes after SARS-CoV-2 infection (<xref ref-type="bibr" rid="B10">10</xref>, <xref ref-type="bibr" rid="B11">11</xref>). It is also well established that there is marked biological variation in how individuals respond and maintain immunity after vaccination which is, in part, attributable to genetic factors (<xref ref-type="bibr" rid="B12">12</xref>). It is, therefore, important to consider the role of HLA polymorphism when designing viral subunit or peptide vaccine formulations and in assessing population coverage and likelihood of immune protection after vaccination (<xref ref-type="bibr" rid="B13">13</xref>).</p>
<p>When considering the role of the HLA system in COVID-19 susceptibility and vaccine responses, it is essential to account for differences in HLA allele frequencies across human populations and, importantly, for the linkage disequilibrium between HLA loci that result in population-specific haplotype frequencies. Here, we utilise information on human HLA haplotype frequencies of twenty five human populations (four broad population categories and twenty one detailed population subcategories) at an unprecedented scale, capitalising on the extensive high-resolution HLA data deposited in the National Marrow Donor Program Registry, to compute population level immune responses against SARS-CoV-2 based on predicted high-affinity binding of viral proteome derived peptides by HLA class II molecules. Overall, we find similar potential for anti-SARS-CoV-2 cellular immunity across all populations examined suggesting that HLA polymorphism is unlikely to account for observed disparities in clinical outcomes after COVID-19 among different race and ethnic groups. However, within populations, we identify wide variability among individuals in predicted CD4<sup>+</sup> T-cell reactivity against structural, non-structural, and accessory SARS-CoV-2 proteins, according to HLA genotype. Nevertheless, we predict robust immune reactivity against the SARS-CoV-2 Spike protein, the basis for the majority of current vaccination efforts, both at the population and at the individual level.</p>
</sec>
<sec id="s2" sec-type="materials|methods">
<title>Materials And Methods</title>
<sec id="s2_1">
<title>Identification of Potential T-Cell Epitopes</title>
<p>Full viral proteome sequences for SARS-CoV-2 were downloaded from UniProt (<xref ref-type="bibr" rid="B14">14</xref>). FASTA-formatted protein sequence data for each protein and protein class were examined individually and in combination. We produced potential peptides of 15 amino acids length (15mers), using sliding windows over the entire proteome. Proteins of fewer than 15 amino acids in length were not examined. Analyses were performed considering proteins individually, some protein domains individually, and in groupings of proteins (both the whole proteome, and all structural, non-structural, and accessory proteins).</p>
</sec>
<sec id="s2_2">
<title>HLA and Haplotype Frequency Computation</title>
<p>HLA population frequencies were obtained from US unrelated stem cell donor registry National Marrow Donor Program (NMDP)/Be The Match. High resolution HLA Class II haplotype frequencies (DRB1, DRB3/4/5, DQA1, DQB1, DPA1 and DPB1 loci) were estimated using an expectation-maximization algorithm [as described by Gragert et&#xa0;al., 2013 (<xref ref-type="bibr" rid="B15">15</xref>)] utilising a cohort of 8.9 million US volunteer donors (NMDP/Be The Match registry snapshot 29/05/2020) HLA typed by molecular methods (<xref ref-type="supplementary-material" rid="SM1">
<bold>Table S1</bold>
</xref> showing number of individuals genotyped). US population categories were developed based on a race/ethnicity questionnaire included on the donor consent form. There were four broad population categories (European American, African American, Asian or Pacific Islander and Hispanic) and 21 detailed populations subcategories (African American, African Black, South Asian Indian, American Indian - South or Central American, Alaska native of Aleut, North American Indian, Caribbean Black, Caribbean Hispanic, Caribbean Indian, European Caucasian, Filipino, Hawaiian or other Pacific Islander, Japanese, Korean, Middle Eastern or North Coast of Africa, Mexican or Chicano, Chinese, Hispanic - South or Central American, Black - South or Central American, Southeast Asian, Vietnamese). Some individuals were assigned only membership of a broad population category.</p>
<p>Following Hardy-Weinberg equilibrium proportions, multi-locus HLA Class II genotypes were generated by randomly sampling two haplotypes from the same population HLA haplotype frequency distribution. Simulated genotypes were generated for each of the four broad and 21 detailed population groups, with ten replicates at each population of size 1,000, 5,000 and 10,000.</p>
<p>For population-based analyses at the haplotype level, we analysed haplotypes up to 99% cumulative coverage within each population. HLA alleles, when examined individually, included all HLA alleles present in any of these selected haplotypes for the four broad and 21 detailed population groups.</p>
</sec>
<sec id="s2_3">
<title>Predicted T-Cell Epitope Identification</title>
<p>Peptide binding affinity was assessed for all Class II HLA that featured in haplotypes in any of the ethnic populations studied using NetMHCIIpan v4.0 (<xref ref-type="bibr" rid="B16">16</xref>). Peptides were examined both for their predicted binding affinity (nM) and their percentage rank (compared to a pool of representative peptides for the corresponding HLA). Peptides were defined as binders if their binding affinity was equal to or less than 500nM and their percentage rank was equal to or greater than 2% (default parameter for strong HLA class II peptide binders). Within the 9,590 15-mer peptides in the entire SARS-CoV-2 proteome, 4,289 peptides were predicted to bind strongly to one or more HLA Class II molecule. Analyses were also performed using alternative binding threshold cut-offs of &#x2264;50nM peptide binding affinity threshold and &#x2264;0.5% percentage rank in combination with a &#x2264;500nM peptide binding affinity threshold. The NetMHCIIpan-4.0 programme also identifies the predicted 9-mer binding core. Of all HLA observed, on average 0.52% of haplotypes contained an HLA that was not in the list of 5,620 HLA available to run on NetMHCIIpan-4.0. Total predicted peptide counts for an individual HLA per protein or per whole proteome were calculated by counting peptides only if they were both unique to one another (i.e., a unique 15-mer), but also if the predicted binding core (9-mer) was also unique. This prevented the count from appearing falsely elevated due to sequential overlapping peptides which were presenting the same core, by preventing them from being counted more than once. Total peptide counts (in the context of an HLA haplotype or genotype) were also enumerated from peptides with both unique 15-mers and 9-mer cores, from binding peptides presented in any Class II HLA within the haplotype or genotype.</p>
</sec>
<sec id="s2_4">
<title>Quantification and Statistical Analysis</title>
<p>Peptide-HLA scoring models were assessed using scikit-learn (<xref ref-type="bibr" rid="B17">17</xref>) in Python, specifically using sklearn.metrics.roc_auc_score (AUROC), sklearn.metrics.average_precision_score (Average Precision), sklearn.metrics.accuracy_score (Accuracy), and sklearn.metrics.classification_report (Sensitivity and Specificity) functions (see <xref ref-type="supplementary-material" rid="SM1">
<bold>Table S3</bold>
</xref>, with n=93 for peptide-HLA combinations). In order to assess AUROC for two predictor variables, a composite predictor was calculated consisting of the normalised sum of both. Population comparisons of peptide scores were performed by calculating the mean and standard deviation using NumPy in Python (see <xref ref-type="supplementary-material" rid="SM1">
<bold>Table S4</bold>
</xref>, N=10,000 individuals in simulated population groups). Population simulations were assessed for normality using statistics.shaipro (Shapiro-Wilk test) and following demonstration of non-normality for all distributions examined, with statistics.kruskal (Kruskal&#x2013;Wallis one-way analysis of variance) to assess differences between replicates of population simulations (all N=10,000), both implemented in Python.</p>
</sec>
</sec>
<sec id="s3" sec-type="results">
<title>Results</title>
<sec id="s3_1">
<title>Experimental Approach</title>
<p>The principal objective of our study was to examine whether genetic variation at the HLA loci may influence immune responses, and therefore COVID-19 clinical outcomes or response to vaccination, among patients from different ethnic populations. HLA class II molecules present peptides from exogenous antigens for CD4<sup>+</sup> T-cell recognition and are therefore critical components for an effective adaptive immune response that incorporates humoral (B-cell) and cytotoxic (CD8<sup>+</sup> T-cell) arms.</p>
<p>We analysed peptide binding for all classical HLA class II loci (HLA-DRB1, -DRB3/4/5, -DQA1, -DQB1, and -DPA1, -DPB1). The main analysis focused on four broad population categories, African Americans (AFA), European Caucasians (CAU), Hispanics (HIS) and Asian/Pacific Islanders (API) and sub-analysis included 21 detailed population subgroups of these broad categories. To account for linkage disequilibrium between HLA class II loci, we analysed HLA haplotypes rather than assuming allele frequencies were independent at each locus. HLA haplotype frequencies were estimated utilising HLA genotype data obtained from a cohort of approximately 8.9 million donors (NMDP/Be The Match registry; <xref ref-type="supplementary-material" rid="SM1">
<bold>Table S1</bold>
</xref>). We analysed a total of 25,128 unique haplotypes to enable 99% coverage of each population which in turn required the analysis of 803 HLA class II molecules (see <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplemental Information</bold>
</xref>). <xref ref-type="supplementary-material" rid="SM1">
<bold>Figure S1</bold>
</xref> depicts the number of distinct HLA-DRB1, -DRB345 alleles and HLA-DQA1/DQB1, DPA1/DPB1 heterodimers examined and associated haplotype coverage in each population. To confirm the robustness of our observations at the individual level, we analysed multiple replicate genotype samples and demonstrate with replicate sets of simulated genotypes of 10,000 individuals that HLA diversity, as measured by the alpha parameter fits to the power law distribution, was stable, and the number of unique haplotypes needed to reach 95% cumulative frequency was also stable across replicates (<xref ref-type="supplementary-material" rid="SM1">
<bold>Table S6</bold>
</xref>).</p>
<p>Immunogenic T-cell epitopes were identified using the full-length reference SARS-CoV-2 sequence (<xref ref-type="bibr" rid="B18">18</xref>) with 9,744 amino acids, which was subdivided into the four structural proteins (E, M, N, and S) and 7 additional open reading frames encoding non-structural proteins (NSP1-16) and accessory proteins (proteins 3a, 6, 7a, 7b, 8 and 10). A sliding window of 15 amino acids length was used and, to minimise redundancy, peptides were only counted towards totals if the HLA class II binding core was unique. To evaluate peptide binding and stable display by HLA class II molecules we employed NetMHCIIpan-4.0 which outputs predicted peptide-HLA binding affinity (IC50) in nanomolar units and percentile rank of binding affinity compared to a set of 100,000 random natural peptides. The percentile rank enables incorporation of information from the biological antigen presentation pathway in addition to the peptide-MHC binding event (<xref ref-type="bibr" rid="B16">16</xref>, <xref ref-type="bibr" rid="B19">19</xref>). We aimed to detect strongly binding peptides and, therefore, elected to use a threshold of &#x2264;2% percentile rank (default parameter for HLA class II strong peptide binding) combined with an affinity threshold &#x2264;500nM (<xref ref-type="bibr" rid="B16">16</xref>). To further increase the stringency of criteria for prediction of peptide binding, such that we maximise precision and reduce the rate of false positive peptides (accepting we may not recall all possible peptides that could be displayed), we also explored a model involving a threshold of &#x2264;0.5% percentage rank and &#x2264;500nM binding affinity. Finally, we examined a binding affinity threshold of &#x2264;50nM, as previously suggested (<xref ref-type="bibr" rid="B13">13</xref>). To validate the computational models we analysed publicly available datasets of experimentally determined, immunogenic SARS-CoV-2 peptides. We focused on the two largest datasets recently described by Snyder et&#xa0;al. (<xref ref-type="bibr" rid="B20">20</xref>, <xref ref-type="bibr" rid="B21">21</xref>) and Nolan et&#xa0;al. (<xref ref-type="bibr" rid="B22">22</xref>) (250 HLA class II peptides) and by Mateus et&#xa0;al. (<xref ref-type="bibr" rid="B23">23</xref>) (135 HLA class II peptides) that contain peptides from the entire SARS-CoV-2 proteome. We also examined two relatively small datasets encompassing 9 nucleocapsid and 25 structural protein-derived (Spike, nucleocapsid or membrane) peptides (<xref ref-type="bibr" rid="B24">24</xref>, <xref ref-type="bibr" rid="B25">25</xref>). In the aforementioned datasets, the HLA restriction was not known and validation focused on positive identification of experimental peptides by the computational models (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplemental Information</bold>
</xref>). We also used an HLA-DRB1*04:01 restricted peptide dataset determined using an <italic>in vitro</italic> peptide-HLA stability assay (<xref ref-type="bibr" rid="B26">26</xref>). Our analyses showed that scoring peptide binding based on a combination of &#x2264;2% percentile rank and &#x2264;500nM binding affinity achieved the best true positive rate (sensitivity) for predicting experimentally derived SARS-CoV-2 peptides (<xref ref-type="supplementary-material" rid="SM1">
<bold>Table S2</bold>
</xref>). Similarly, in the HLA restricted dataset by Prachar et al, the combined &#x2264;2% percentile rank and &#x2264;500nM binding affinity threshold had an AUROC of 0.85 and provided the best combination of precision and specificity in classifying stable peptide binders compared to alternative scoring methods (<xref ref-type="supplementary-material" rid="SM1">
<bold>Table S3A</bold>
</xref>). Finally, we validated our approach using a recently published dataset of experimentally determined CD4<sup>+</sup> T-cell epitopes (<xref ref-type="bibr" rid="B27">27</xref>) and demonstrated that our approach does not introduce systematic bias across the studied populations and does not over-predict the number of immunogenic epitopes (<xref ref-type="supplementary-material" rid="SM1">
<bold>Table S3B</bold>
</xref>). It should be noted that using a 50nM threshold, without accounting for binding characteristics of natural peptides, resulted in 46% of HLA alleles examined lacking presentation of any SARS-CoV-2 peptides and a bias towards HLA-DR as the major SARS-CoV-2 peptide presenting molecules (<xref ref-type="supplementary-material" rid="SM1">
<bold>Figure S2</bold>
</xref>). Nevertheless, we have confirmed key aspects of our analyses using both a &#x2264;0.5% percentage rank in combination with a &#x2264;500nM peptide binding affinity threshold, and using a &#x2264;50nM peptide binding affinity threshold alone. Overall, a total of 9,590 15-mer peptides, derived from all 11 SARS-CoV-2 genes, were examined and 4,289 peptides were predicted to bind strongly according to our defined criteria to at least one HLA class II molecule.</p>
</sec>
<sec id="s3_2">
<title>SARS-CoV-2 Viral Proteome Presentation at the Molecular HLA Class II Level</title>
<p>We first examined presentation of viral epitopes by all HLA class II molecules contained in haplotypes representing 99% of the four major broad ethnic populations. Assessment of presentation capacity at the entire viral proteome level (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1A</bold>
</xref>) showed that the majority of HLA class II molecules are capable of presenting SARS-CoV-2 peptides, albeit with significant variability. HLA-DR alleles have the highest viral peptide presentation capacity followed by HLA-DP and, to a significantly lower extent, HLA-DQ molecules. Notably, certain common individual HLA molecules were predicted to have very limited ability to present viral peptides, including DQA1*03:01~DQB1*02:01 (no peptide presentation from any protein within the SARS-CoV-2 proteome; with frequency of 3.2% within AFA haplotypes, &lt;0.01% within API haplotypes, 0.1% within CAU haplotypes and 0.5% within HIS haplotypes), DRB1*03:02 (two peptides presented in total from the entire proteome; with frequency of 6.3% within AFA haplotypes, 0.01% within API haplotypes, 0.04% within CAU haplotypes and 1.0% within HIS haplotypes). Consistent with its known high immunogenicity (<xref ref-type="bibr" rid="B10">10</xref>, <xref ref-type="bibr" rid="B27">27</xref>&#x2013;<xref ref-type="bibr" rid="B31">31</xref>), Spike protein derived peptides showed strong binding for the majority of HLA class II molecules although presentation capacity again varied and was lowest (no peptides presented) for relatively common alleles such as DQA1*01:01~DQB1*05:03, with a frequency of 1.9-5.4% in each of the four broad population groups (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1B</bold>
</xref>). This observation was more prominent for Nucleocapsid derived peptides where strong binding was predicted to be absent in 117 out of 306 HLA molecules found in 99% of haplotypes in the four broad ethnic populations (mostly reflecting HLA-DP molecules and to some extent -DQ molecules; <xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1C</bold>
</xref>). Similar findings were noted for the relatively small Membrane and Envelope structural proteins, with the latter predicted to be non-immunogenic for the majority of common HLA class II molecules (<xref ref-type="fig" rid="f1">
<bold>Figures&#xa0;1D, E</bold>
</xref>). For non-structural proteins, HLA class II presentation capacity was variable and dependent upon protein amino acid sequence length (data not shown).</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>SARS-CoV-2 viral proteome presentation at the molecular HLA class II level. The number of viral peptides presented by individual HLA is shown for <bold>(A)</bold> the entire SARS-CoV-2 proteome; <bold>(B)</bold>. Spike protein (S protein); <bold>(C)</bold> Nucleocapsid protein (N protein); <bold>(D)</bold> Membrane protein (M protein); and <bold>(E)</bold> Envelope protein (E protein). The HLA frequency in four broad ethnic populations is shown (AFA, African Americans; API, Asian and Pacific Islanders; CAU, Caucasians; HIS, Hispanics). Bars are coloured according to HLA locus, as shown. HLA were included in the figure if they had a frequency of &#x2265; 1% in any haplotype distribution from the four broad population groups.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fimmu-12-669357-g001.tif"/>
</fig>
</sec>
<sec id="s3_3">
<title>SARS-CoV-2 Proteome Immunogenicity at the Population Level</title>
<p>The capacity of individuals to present viral peptides for recognition by CD4<sup>+</sup> T-cells depends on the composition of their HLA class II alleles in their inherited haplotypes. Given variation in population-specific HLA haplotype frequencies, we hypothesised that potential differences in SARS-CoV-2 proteome immunogenicity (as reflected by HLA class II peptide presentation) at the population level may reflect disparities in capacity for effective anti-SARS-CoV-2 immunity which could in turn influence response to vaccination or underpin observed variability in COVID-19 clinical outcomes among different ethnic populations. To investigate this hypothesis, we examined viral proteome presentation by HLA class II, accounting for the distribution of HLA haplotypes in a population. This analysis showed that the overall capacity for HLA peptide presentation, at the whole SARS-CoV-2 proteome level, among the four broad ethnic populations examined was remarkably similar (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2A</bold>
</xref>). This was also the case considering T-cell epitopes from each SARS-CoV-2 protein (<xref ref-type="supplementary-material" rid="SM1">
<bold>Table S4</bold>
</xref>), suggesting that polymorphism at the HLA genomic region is unlikely to underpin potential differences in immune responses and, thus, in clinical outcomes among ethnic groups. It was notable, however, that within ethnic populations the capacity of individual HLA haplotypes to present viral peptides varied widely (data on HLA haplotypes examined and SARS-CoV-2 peptide presentation for the four broad ethnic populations is provided in <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplemental Information</bold>
</xref>), with the top 5% of haplotypes predicted to present between 497 and 591 peptides from the entire viral proteome (such as DRB1*04:01~DRB4*01:01~DQA1*03:01~DQB1*03:01~DPA1* 01:03~DPB1*04:01 which represents 1% of AFA haplotypes, 0.14% of API haplotypes, 3.9% of CAU haplotypes and 0.9% of HIS haplotypes, predicted to present 506 SARS-CoV-2 peptides) as opposed to 5% of haplotypes at the opposite end of the spectrum predicted to present approximately 316 viral peptides or fewer (e.g. DRB1*03:01~DRB3*01:01~DQA1*05:01~DQB1* 02:01~DPA1*02:01~DPB1*01:01 which represents 0.25% of AFA haplotypes, 0.02% of API haplotypes, 3.5% of CAU haplotypes and 1.4% of HIS haplotypes, predicted to present 258 peptides). This observation suggests that individual capacity to mount CD4<sup>+</sup> T-cell immune responses against SARS-CoV-2 is not uniform and is likely dependent on HLA phenotype. Similar inter-individual variability was noted for peptide presentation derived from structural and from non-structural proteins as well as for distinct SARS-CoV-2 proteins examined (<xref ref-type="fig" rid="f2">
<bold>Figures&#xa0;2B&#x2013;E</bold>
</xref> and <xref ref-type="supplementary-material" rid="SM1">
<bold>S3</bold>
</xref>). Recent experimental studies suggested that up to 70% of CD4<sup>+</sup> T-cell responses against SARS-CoV-2 target the Spike, Membrane and Nucleocapsid antigens (<xref ref-type="bibr" rid="B10">10</xref>); our analysis showed the predicted CD4<sup>+</sup> T-cell response to these structural proteins is highly variable at the haplotype level (<xref ref-type="fig" rid="f2">
<bold>Figures&#xa0;2B&#x2013;D</bold>
</xref>). In agreement with the observed immunogenicity of Spike protein in experimental studies (<xref ref-type="bibr" rid="B28">28</xref>&#x2013;<xref ref-type="bibr" rid="B31">31</xref>), relatively high numbers of Spike-derived peptides were predicted to be recognised both within and across ethnic populations (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2B</bold>
</xref>). In contrast, our analysis suggests that on average 13.9% of HLA haplotypes within each population have low capacity (&#x2264;2 peptides) to present Nucleocapsid-derived peptides (e.g. DRB1* 03:02~DRB3*01:01~DQA1*04:01~DQB1*04:02 ~DPA1*02:02~DPB1*01:01 which presents one peptide, and accounts for 4.98% of haplotypes found in AFA populations and 0.44% in HIS populations, although it is rare in API and CAU populations; <xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2C</bold>
</xref>). This inter-individual variability may, in part, account for the heterogeneity in the presence and magnitude of CD4<sup>+</sup> T-cell and antibody responses against the Nucleocapsid protein noted in recent COVID-19 studies (<xref ref-type="bibr" rid="B10">10</xref>, <xref ref-type="bibr" rid="B32">32</xref>, <xref ref-type="bibr" rid="B33">33</xref>). Among non-structural viral proteins, our analysis suggested NSP3, NSP4 and NSP12 as the most immunogenic, in part reflecting their size, in each population (<xref ref-type="supplementary-material" rid="SM1">
<bold>Figure S3</bold>
</xref>). The above noted similarity in overall capacity for SARS-CoV-2 peptide presentation among different populations was also observed at different (more stringent) thresholds for HLA-peptide binding, albeit with even higher individual variability within ethnic populations (500nM binding affinity and &#x2264;0.5% percentage rank or &#x2264;50nM binding affinity; <xref ref-type="supplementary-material" rid="SM1">
<bold>Figure S4</bold>
</xref>).</p>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>SARS-CoV-2 derived peptide presentation at the HLA haplotype level. Panels depict SARS-CoV-2 peptide presentation by HLA class II haplotypes representing 99% of total haplotypes within four broad population groups (African Americans, Asian Pacific Islanders, Caucasians and Hispanics). <bold>(A)</bold> Whole Proteome. <bold>(B)</bold> Spike protein (S protein). <bold>(C)</bold> Nucleocapsid protein (N protein). <bold>(D)</bold> Membrane protein (M protein). <bold>(E)</bold> Envelope protein (E protein). The width of each step in the curves is proportional to the relative frequency of a specific HLA haplotype.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fimmu-12-669357-g002.tif"/>
</fig>
<p>To further explore the consequences of the above observations at the individual level, and given that every individual expresses two HLA haplotypes, we generated 10 replicates each of random genotype datasets encompassing 1,000, 5,000 and 10,000 simulated individuals for each population, as described in the methods. Populations encompassing 10,000 individuals achieved &gt;95% cumulative HLA haplotype coverage in every population. As shown in <xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3</bold>
</xref>, this analysis confirmed equivalent HLA class II presentation of SARS-CoV-2 peptides across all four broad ethnic populations, both at the entire viral proteome level and for individual proteins (<xref ref-type="supplementary-material" rid="SM1">
<bold>Table S4</bold>
</xref>). As noted for the HLA haplotype analysis, there was wide inter-individual variability in predicted potential for CD4<sup>+</sup> T-cell immune responses, according to HLA genotype. We noted significant, but variable, capacity for T-cell reactivity against the entire Spike glycoprotein across individuals, whereas reactivity against the Nucleocapsid protein was predicted to be weaker for 10% of individuals in each population, on average (range 7.8-13.3%, as defined by HLA presentation of less than 5 nucleocapsid peptides). These observations were confirmed (but, again, inter-individual variability was higher) using more stringent thresholds for defining HLA class II peptide presentation (data not shown). In further analysis, we considered immune reactivity against the Receptor Binding Domain (RBD) of Spike glycoprotein, as it represents a proposed target of coronavirus subunit vaccines currently in clinical trials (<xref ref-type="bibr" rid="B34">34</xref>&#x2013;<xref ref-type="bibr" rid="B36">36</xref>). Although, overall, there was no significant difference in predicted CD4<sup>+</sup> T-cell reactivity at the population level, there were notable differences at the individual level (both based on HLA haplotype and on genotype analyses) with wide variation in predicted RBD specific peptide presentation (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3F</bold>
</xref>). The above analyses were consistent irrespective of the size of the population sampled and among the 10 replicates at each population size (Kruskal-Wallis test p-value &gt;0.05 for peptide comparisons at the population level).</p>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>SARS-CoV-2 derived peptide presentation at the HLA genotype level (broad population groups). Panels depict the number of SARS-CoV-2 peptides presented by individual HLA class II genotypes in simulated populations of 10,000 individuals for four broad population groups (African Americans, Asian Pacific Islanders, Caucasians and Hispanics). <bold>(A)</bold> Whole Proteome. <bold>(B)</bold> Spike protein (S protein). <bold>(C)</bold>. Nucleocapsid protein (N protein). <bold>(D)</bold> Membrane protein (M protein). <bold>(E)</bold> Envelope protein (E protein). <bold>(F)</bold> Receptor Binding Domain of Spike protein. The width of each step in the curves is proportional to the relative frequency of a specific HLA genotype. The boxplot charts depict the median, interquartile range (box) and range (whiskers - excluding outliers) for the number of viral peptides presented at the population level for each of the above ethnic groups.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fimmu-12-669357-g003.tif"/>
</fig>
<p>We next examined HLA class II presentation of SARS-CoV-2 peptides for a further 21 detailed population subgroups, as described above (<xref ref-type="supplementary-material" rid="SM1">
<bold>Figure S5</bold>
</xref> and <xref ref-type="supplementary-material" rid="SM1">
<bold>Table S4</bold>
</xref>). Overall, analysis of the entire viral proteome identified similar capacity for HLA class II viral peptide presentation across population subgroups. This was also the case for structural proteins, including Spike and RBD, mirroring the findings above for the broad population groups. Although we did not identify SARS-CoV-2 vulnerability of particular populations at the HLA level, again we observed inter-individual variation in predicted cellular immunity within ethnic groups. This was reflected in the range of predicted viral peptide presentation within simulated populations of 10,000 individuals including 24-112 for Spike, 4-25 for RBD, 1-24 for Nucleocapsid and 208-854 for the entire proteome (<xref ref-type="supplementary-material" rid="SM1">
<bold>Table S4</bold>
</xref>).</p>
</sec>
<sec id="s3_4">
<title>Immunogenicity Maps of SARS-CoV-2 Proteome at the Population Level</title>
<p>The effectiveness of peptide and subunit vaccine formulations against SARS-CoV-2 depends on robust presentation by individual HLA class II molecules and, therefore, investigated vaccines should account for linkage disequilibrium and HLA haplotype frequencies in different ethnic populations to achieve universal coverage. Capitalising on extensive HLA haplotype frequency data from the NMDP/Be The Match registry, we generated maps of SARS-CoV-2 immunogenicity for the entire viral proteome. This analysis showed that each viral protein contains immunogenic peptide segments with variable degree of population coverage which is, on the whole, similar across different populations for a given protein region, as well as peptide segments of variable length that are non-immunogenic in any population (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4</bold>
</xref>). Similar observations were made for coronavirus subunit components that are being investigated as potential vaccines with several immunogenic peptides predicted to achieve universal coverage across population groups (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4</bold>
</xref>). This was particularly evident for the Spike protein underlying its inherent immunogenicity and its potential as vaccination target. <xref ref-type="supplementary-material" rid="SM1">
<bold>Table S5</bold>
</xref>, depicts SARS-CoV-2 immunogenic peptide segments predicted to cover over 90% of HLA genotypic variation in every broad ethnic group examined.</p>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>Immunogenicity maps of SARS-CoV-2 proteome at the population level. The panels depict the percentage of HLA class II genotypes, within populations of 10,000 individuals (AFA, African Americans; API, Asian Pacific Islanders; CAU, Caucasians and HIS, Hispanics), that are predicted to present individual SARS-CoV-2 peptides from <bold>(A)</bold>. Spike protein (S protein), S1, S2 and Receptor Binding Domain (RBD) are also shown; <bold>(B)</bold>. Nucleocapsid protein (N protein); <bold>(C)</bold>. Membrane protein (M protein); <bold>(D)</bold>. Envelope protein (E protein); and <bold>(E)</bold>. Open Reading Frame (ORF) 1ab polyprotein.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fimmu-12-669357-g004.tif"/>
</fig>
</sec>
</sec>
<sec id="s4" sec-type="discussion">
<title>Discussion</title>
<p>Recognition of SARS-CoV-2 peptides in the context of HLA class II molecules is essential for CD4<sup>+</sup> T-cell activation and proliferation which, in turn, orchestrate the development of effector cellular (CD8<sup>+</sup> T-cell) and humoral adaptive immune responses after viral infection and after vaccination. In this computational study, we investigated the role of HLA on SARS-CoV-2 immunogenicity at the individual and at the population level, considering population-specific HLA allele, haplotype, and genotype frequencies. We accounted for genetic polymorphism and for HLA linkage disequilibrium in twenty five ethnic populations by capitalising on, to our knowledge, the most extensive HLA haplotype frequency information to date to predict SARS-CoV-2 specific CD4<sup>+</sup> T-cell epitopes covering the entire viral proteome. We find that the overall capacity for anti SARS-CoV-2 cellular immunity according to HLA class II genotype is similar at the population level across all ethnic groups examined. However, we identify wide inter-individual variability in predicted CD4<sup>+</sup> T-cell reactivity against every SARS-CoV-2 protein according to expressed HLA genotype. We predict robust immune reactivity against the SARS-CoV-2 Spike protein, the basis for the majority of current vaccination efforts, both at the population and at the individual level regardless of population origin. Finally, we provide comprehensive maps of SARS-CoV-2 proteome immunogenicity accounting for population coverage in ethnic groups.</p>
<p>Several recent studies have examined the cellular immune response to SARS-CoV-2 and revealed strong associations between the T-cell response and COVID-19 severity (<xref ref-type="bibr" rid="B29">29</xref>, <xref ref-type="bibr" rid="B37">37</xref>). Although this relationship is complex to untangle when the peripheral T-cell repertoire is sampled during the acute phase, it is notable that SARS-CoV-2 specific CD4<sup>+</sup> T-cells have been associated with lessened COVID-19 severity and that high frequency of Spike-specific CD4<sup>+</sup> T-cell responses were observed in patients who had recovered from COVID-19 (<xref ref-type="bibr" rid="B10">10</xref>, <xref ref-type="bibr" rid="B29">29</xref>, <xref ref-type="bibr" rid="B38">38</xref>, <xref ref-type="bibr" rid="B39">39</xref>). A coordinated and regulated response involving all branches of adaptive immunity (CD4<sup>+</sup>, CD8<sup>+</sup> and antibody responses) is likely required to reduce COVID-19 severity, with the cellular response being key for both initiating the adaptive response and for controlling the acute infection (<xref ref-type="bibr" rid="B29">29</xref>). Even though neutralising antibody titres are not predictive of disease severity (<xref ref-type="bibr" rid="B29">29</xref>, <xref ref-type="bibr" rid="B40">40</xref>), humoral responses are a key aspect of protective immunity after infection and critical for generating sterilising immunity after vaccination (<xref ref-type="bibr" rid="B34">34</xref>, <xref ref-type="bibr" rid="B41">41</xref>). In this respect, current evidence suggests a strong association between the magnitude of Spike-specific CD4<sup>+</sup> T-cells and neutralising antibody titres (<xref ref-type="bibr" rid="B10">10</xref>, <xref ref-type="bibr" rid="B30">30</xref>, <xref ref-type="bibr" rid="B38">38</xref>). Finally, the majority of recent literature on anti-SARS-CoV-2 immunity indicates there is a high degree of heterogeneity in the breadth and magnitude of both humoral and cellular responses to SARS-CoV-2 both at the individual patient level and in relation to specific viral proteins (<xref ref-type="bibr" rid="B10">10</xref>, <xref ref-type="bibr" rid="B29">29</xref>, <xref ref-type="bibr" rid="B42">42</xref>). Within this context, the observation that patients with severe COVID-19 had decreased diversity of T-cell responses suggested that recognition of multiple SARS-CoV-2 T-cell epitopes may be required for development of protective immunity after infection or after vaccination (<xref ref-type="bibr" rid="B43">43</xref>).</p>
<p>The above observations on anti-SARS-CoV-2 cellular immunity from experimental studies and the role of HLA in shaping the diversity of the T-cell repertoire (<xref ref-type="bibr" rid="B44">44</xref>, <xref ref-type="bibr" rid="B45">45</xref>), place the findings of our study into context. With regards to susceptibility to COVID-19, we hypothesised that genetic variation at the HLA complex may account for observed differences in clinical outcomes between ethnic groups (<xref ref-type="bibr" rid="B2">2</xref>, <xref ref-type="bibr" rid="B46">46</xref>, <xref ref-type="bibr" rid="B47">47</xref>). We performed a comprehensive analysis of HLA haplotypes and genotypes covering 99% of genetic HLA variation within twenty five ethnic populations and showed that the predicted CD4<sup>+</sup> T-cell response is overall remarkably similar at the population level both looking at the entire SARS-CoV-2 proteome and for individual viral proteins. This observation is supported by more nuanced recent investigations which show equivalent COVID-19 clinical outcomes after adjustment for potential socioeconomic and clinical confounders (<xref ref-type="bibr" rid="B7">7</xref>, <xref ref-type="bibr" rid="B8">8</xref>). We did, however, find significant inter-individual variability in predicted SARS-CoV-2 proteome immunogenicity according to HLA phenotype. This variability was more pronounced for particular viral proteins, such as nucleocapsid, membrane protein and envelope protein and less evident when the entire viral proteome was considered where, even at the lower end of the spectrum, HLA haplotypes were predicted to present a significant number of CD4<sup>+</sup> T-cell epitopes. Given the relevance of diversity and magnitude of cellular immunity against SARS-CoV-2, as discussed above, it is tempting to speculate that HLA phenotype might underpin some of the observed inter-individual variability in COVID-19 outcomes, along with more established clinical factors. This might depend on the relative contribution of SARS-CoV-2 proteins to the quality of the immune response. For example, Grifoni et&#xa0;al. (<xref ref-type="bibr" rid="B10">10</xref>) have shown that up to 70% of CD4<sup>+</sup> T-cell responses against SARS-CoV-2 target the Spike, Membrane and Nucleocapsid antigens whereas significant reactivity was also noted against nsp3, nsp4 and ORF8. Despite significant differences between the highest and lowest peptide presenting HLA haplotypes, we noted substantial numbers of Spike-specific CD4<sup>+</sup> T-cell peptides presented by the majority of HLA haplotypes in all ethnic groups examined; in comparison, inter-individual variability according to HLA haplotype was more pronounced for the remaining of the above, and other, viral proteins. Whether this observation might translate into differential clinical outcomes or levels of protective immunity according to expressed HLA type would need to be examined in large clinical studies that encompass cohorts representative of the HLA polymorphism within particular populations. Certainly, evidence supporting an important role of HLA class II in viral immunity has been previously reported (<xref ref-type="bibr" rid="B48">48</xref>, <xref ref-type="bibr" rid="B49">49</xref>). The current SARS-CoV-2 pandemic represents a unique opportunity to address such fundamental questions which have recently started to be explored (<xref ref-type="bibr" rid="B50">50</xref>, <xref ref-type="bibr" rid="B51">51</xref>).</p>
<p>It is also well established that individual response, including efficacy and relative antibody levels, and maintenance of immunity after vaccination varies markedly and this biological variation results from a combination of environmental (such as age, size, sex, comorbid status, ethnicity, and dose and route of vaccine administration) and genetic factors (<xref ref-type="bibr" rid="B12">12</xref>, <xref ref-type="bibr" rid="B49">49</xref>). Non-responsiveness affects approximately 2-10% (and up to 20% following hepatitis B vaccination) of vaccinated healthy individuals (<xref ref-type="bibr" rid="B52">52</xref>, <xref ref-type="bibr" rid="B53">53</xref>). HLA class II haplotype plays a central role in the presentation of vaccine epitopes and is a known genetic risk factor for primary vaccination failure (<xref ref-type="bibr" rid="B52">52</xref>, <xref ref-type="bibr" rid="B54">54</xref>, <xref ref-type="bibr" rid="B55">55</xref>). Given that the majority of current vaccination efforts are focused on generating immunity against the Spike protein of SARS-CoV-2, we calculated the number of Spike-specific CD4<sup>+</sup> T-cell epitopes according to HLA genotype. Our analysis suggests that immune reactivity against Spike is likely to be robust both at the population level, including all 25 ethnic groups examined, and at the individual level. This finding is now supported experimentally by studies reporting high degree of seroconversion against Spike after natural infection and after vaccination (<xref ref-type="bibr" rid="B28">28</xref>, <xref ref-type="bibr" rid="B30">30</xref>, <xref ref-type="bibr" rid="B42">42</xref>, <xref ref-type="bibr" rid="B56">56</xref>&#x2013;<xref ref-type="bibr" rid="B61">61</xref>). Nevertheless, we noted inter-individual variation ranging from 112 peptides for the highest presenting HLA class II genotypes to 24 for the lowest. Whether such variation may affect the magnitude and diversity of protective immunity generated after vaccination requires further study but it is notable that variation in the degree of cellular immunity has been reported with a few vaccine formulations (<xref ref-type="bibr" rid="B57">57</xref>, <xref ref-type="bibr" rid="B60">60</xref>, <xref ref-type="bibr" rid="B62">62</xref>). To our knowledge, the relationship between HLA genotype, number of vaccine-derived T-cell epitopes and vaccine responsiveness has not been systematically examined yet, although this is the focus of current research efforts in the context of COVID-19.</p>
<p>It is important to acknowledge the limitations of our study. We used a computational approach to predict SARS-CoV-2 peptides presented by HLA class II molecules, however, peptide presentation does not always lead to CD4<sup>+</sup> T-cell activation; peptide recognition is complex and incompletely understood and is influenced by many factors, including relative expression of individual viral proteins (<xref ref-type="bibr" rid="B63">63</xref>). Nevertheless, NetMHCIIpan-4.0 is an established and validated algorithm for T-cell epitope prediction that has recently been updated resulting in improved performance (<xref ref-type="bibr" rid="B19">19</xref>). Recent computational studies investigating SARS-CoV-2 vaccine immunogenicity have based their approach for T-cell epitope selection exclusively on peptide-HLA binding affinity incorporating different thresholds (e.g. 500nM or 50nM) and identified population coverage gaps in predicted cellular immunity (<xref ref-type="bibr" rid="B13">13</xref>, <xref ref-type="bibr" rid="B64">64</xref>, <xref ref-type="bibr" rid="B65">65</xref>). This approach is affected by inherent bias of certain HLA molecules towards higher or lower mean predicted affinities; thus, we show that the 50nM binding affinity threshold, one of the most commonly used, is heavily biased towards HLA-DR as the main SARS-CoV-2 peptide presenting locus with the majority of HLA-DQ and -DP molecules showing no peptide binding. Accordingly, using a 50nM binding affinity threshold for defining peptide immunogenicity resulted in very wide inter-individual variability in predicted CD4<sup>+</sup> T-cell reactivity against SARS-CoV-2 proteins (<xref ref-type="supplementary-material" rid="SM1">
<bold>Figure S4</bold>
</xref>). To overcome this limitation, we incorporated both binding affinity prediction and percentile rank, compared to a set of 100,000 random natural peptides, for epitope selection. The rank score normalizes prediction scores across different HLA molecules and enables interspecific HLA binding prediction comparisons; nevertheless, part of the difference in the peptide binding capacity of HLA molecules (highest for HLA-DR) in this study may reflect training of NetMHCIIpan-4.0 algorithm on peptide datasets that contain more information on HLA-DR restricted peptides. Notwithstanding that currently there is limited information on experimentally determined SARS-CoV-2 immunogenic T-cell epitopes and even less information on peptide HLA restriction, we have used available information in the published literature to validate our approach. We focused on prediction of strongly HLA binding peptides and demonstrated that our peptide selection threshold correctly identified the majority of experimentally determined immunogenic viral peptides in the largest published datasets (<xref ref-type="bibr" rid="B20">20</xref>, <xref ref-type="bibr" rid="B23">23</xref>). We also aimed to minimise the rate of false positive peptides and showed, in a limited experimental SARS-CoV-2 peptide dataset with HLA restrictions published by Prachar et al, that our 500nM binding affinity and &#x2264;2% rank threshold for peptide selection, achieves high precision and specificity (1.0 for both). Also, we confirmed that our observations on SARS-CoV-2 immunogenicity, both in relation to the comparison of population level responses and in relation to inter-individual variability, remained valid when we used more stringent peptide selection criteria (500nM and &#x2264;0.5% rank) and the commonly used 50nM binding affinity threshold. Finally, we used the NMDP/Be The Match registry to compute HLA population frequencies. In terms of population genetics, this study is limited in that the breadth of HLA diversity of global human populations is incompletely represented by the US population categories, and sampling depth varied widely among those categories included. However, the accuracy of US population HLA frequency estimates has been validated in multiple practical settings in transplantation, and HLA frequencies from many global population datasets from other stem cell registries often have high similarity with US population estimates (<xref ref-type="bibr" rid="B66">66</xref>&#x2013;<xref ref-type="bibr" rid="B68">68</xref>).</p>
<p>In conclusion, we present a rigorous immune-informatics approach to evaluate the potential for cellular immunity against SARS-CoV-2 at the population and at the individual level capitalising on, to our knowledge, the most comprehensive assessment of HLA genetic variation to date. Our findings provide important insight on the potential role of HLA polymorphism on development of protective immunity after SARS-CoV-2 infection and after vaccination and a firm basis for further experimental studies in this field.</p>
</sec>
<sec id="s5">
<title>Data Availability Statement</title>
<p>The datasets generated and analysed for this study has been deposited in Mendeley Data: HLA haplotype population frequency data - US unrelated stem cell donor registry National Marrow Donor Program (NMDP) / Be The Match (<xref ref-type="bibr" rid="B69">69</xref>) and Data on HLA haplotypes examined and SARS-CoV-2 peptide presentation for the four broad ethnic populations (<xref ref-type="bibr" rid="B70">70</xref>). </p>
</sec>
<sec id="s6">
<title>Author Contributions</title>
<p>HC, VK, AL and LG contributed to definition of the central question and solutions. HC developed and implemented the peptide-HLA prediction models, the HLA, haplotype and population analysis and the algorithm validation with advice and supervision from AL and VK. LG performed the HLA population frequency computation, calculated the Haplotype frequency distributions, generated simulated populations and performed the statistical analysis on simulated populations. VK conceived and supervised the work and wrote the manuscript. All authors contributed to the article and approved the submitted version.</p>
</sec>
<sec id="s7" sec-type="funding-information">
<title>Funding</title>
<p>The research presented in this manuscript has received funding from the NIHR Blood and Transplant Research Unit in Organ Donation and Transplantation at the University of Cambridge, from the NIHR Cambridge Biomedical Research Centre and from an NIHR Fellowship (PDF-2016-09-065, VK). We gratefully acknowledge funding from an MRC Clinical Research Training Fellowship to HC (MR/S006745/1). VL acknowledges funding as a P.I. Terasaki Scholar. AL acknowledges funding by the Member States of the European Molecular Biology Laboratory (EMBL).</p>
</sec>
<sec id="s8" sec-type="COI-statement">
<title>Conflict of Interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
</body>
<back>
<ack>
<title>Acknowledgments</title>
<p>We thank the US Registry National Marrow Donor Program/Be The Match and the 38+ million stem cell registry volunteers worldwide. The views expressed are those of the authors and not necessarily those of the National Health Service, the National Institute for Health Research, the Department of Health, or National Health Service Blood and Transplant.</p>
</ack>
<sec id="s9" sec-type="supplementary-material">
<title>Supplementary Material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fimmu.2021.669357/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fimmu.2021.669357/full#supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="DataSheet_1.docx" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"/>
<supplementary-material xlink:href="DataSheet_2.xlsx" id="SM2" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/>
<supplementary-material xlink:href="DataSheet_3.xlsx" id="SM3" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<label>1</label>
<citation citation-type="web">
<source>WHO_COVID-19_Dashboard</source>. Available at: <uri xlink:href="https://covid19.who.int/">https://covid19.who.int/</uri>.</citation>
</ref>
<ref id="B2">
<label>2</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Williamson</surname> <given-names>EJ</given-names>
</name>
<name>
<surname>Walker</surname> <given-names>AJ</given-names>
</name>
<name>
<surname>Bhaskaran</surname> <given-names>K</given-names>
</name>
<name>
<surname>Bacon</surname> <given-names>S</given-names>
</name>
<name>
<surname>Bates</surname> <given-names>C</given-names>
</name>
<name>
<surname>Morton</surname> <given-names>CE</given-names>
</name>
<etal/>
</person-group>. <article-title>Factors Associated With COVID-19-Related Death Using Opensafely</article-title>. <source>Nature</source> (<year>2020</year>) <volume>584</volume>:<fpage>430</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41586-020-2521-4</pub-id>
</citation>
</ref>
<ref id="B3">
<label>3</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Grasselli</surname> <given-names>G</given-names>
</name>
<name>
<surname>Zangrillo</surname> <given-names>A</given-names>
</name>
<name>
<surname>Zanella</surname> <given-names>A</given-names>
</name>
<name>
<surname>Antonelli</surname> <given-names>M</given-names>
</name>
<name>
<surname>Cabrini</surname> <given-names>L</given-names>
</name>
<name>
<surname>Castelli</surname> <given-names>A</given-names>
</name>
<etal/>
</person-group>. <article-title>Baseline Characteristics and Outcomes of 1591 Patients Infected With SARS-CoV-2 Admitted to ICUs of the Lombardy Region, Italy</article-title>. <source>JAMA</source> (<year>2020</year>) <volume>323</volume>:<fpage>1574</fpage>. doi: <pub-id pub-id-type="doi">10.1001/jama.2020.5394</pub-id>
</citation>
</ref>
<ref id="B4">
<label>4</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chow</surname> <given-names>N</given-names>
</name>
<name>
<surname>Fleming-Dutra</surname> <given-names>K</given-names>
</name>
<name>
<surname>Gierke</surname> <given-names>R</given-names>
</name>
<name>
<surname>Hall</surname> <given-names>A</given-names>
</name>
<name>
<surname>Hughes</surname> <given-names>M</given-names>
</name>
<name>
<surname>Pilishvili</surname> <given-names>T</given-names>
</name>
<etal/>
</person-group>. <article-title>Preliminary Estimates of the Prevalence of Selected Underlying Health Conditions Among Patients with Coronavirus Disease 2019 - United States, February 12-March 28, 2020</article-title>. <source>MMWR Morbidity Mortality Weekly Rep</source> (<year>2020</year>) <volume>69</volume>:<fpage>382</fpage>. doi: <pub-id pub-id-type="doi">10.15585/mmwr.mm6913e2</pub-id>
</citation>
</ref>
<ref id="B5">
<label>5</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Richardson</surname> <given-names>S</given-names>
</name>
<name>
<surname>Hirsch</surname> <given-names>JS</given-names>
</name>
<name>
<surname>Narasimhan</surname> <given-names>M</given-names>
</name>
<name>
<surname>Crawford</surname> <given-names>JM</given-names>
</name>
<name>
<surname>McGinn</surname> <given-names>T</given-names>
</name>
<name>
<surname>Davidson</surname> <given-names>KW</given-names>
</name>
<etal/>
</person-group>. <article-title>Presenting Characteristics, Comorbidities, and Outcomes Among 5700 Patients Hospitalized With Covid-19 in the New York City Area</article-title>. <source>JAMA</source> (<year>2020</year>) <volume>323</volume>:<fpage>2052</fpage>. doi: <pub-id pub-id-type="doi">10.1001/jama.2020.6775</pub-id>
</citation>
</ref>
<ref id="B6">
<label>6</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hsu</surname> <given-names>HE</given-names>
</name>
<name>
<surname>Ashe</surname> <given-names>EM</given-names>
</name>
<name>
<surname>Silverstein</surname> <given-names>M</given-names>
</name>
<name>
<surname>Hofman</surname> <given-names>M</given-names>
</name>
<name>
<surname>Lange</surname> <given-names>SJ</given-names>
</name>
<name>
<surname>Razzaghi</surname> <given-names>H</given-names>
</name>
<etal/>
</person-group>. <article-title>Race/Ethnicity, Underlying Medical Conditions, Homelessness, and Hospitalization Status of Adult Patients With COVID-19 at an Urban Safety-Net Medical Center - Boston, Massachusetts, 2020</article-title>. <source>MMWR Morbidity Mortality Weekly Rep</source> (<year>2020</year>) <volume>69</volume>:<fpage>864</fpage>. doi: <pub-id pub-id-type="doi">10.15585/mmwr.mm6927a3</pub-id>
</citation>
</ref>
<ref id="B7">
<label>7</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Price-Haywood</surname> <given-names>EG</given-names>
</name>
<name>
<surname>Burton</surname> <given-names>J</given-names>
</name>
<name>
<surname>Fort</surname> <given-names>D</given-names>
</name>
<name>
<surname>Seoane</surname> <given-names>L</given-names>
</name>
</person-group>. <article-title>Hospitalization and Mortality Among Black Patients and White Patients With Covid-19</article-title>. <source>N Engl J Med</source> (<year>2020</year>) <volume>382</volume>:<fpage>2534</fpage>. doi: <pub-id pub-id-type="doi">10.1056/NEJMsa2011686</pub-id>
</citation>
</ref>
<ref id="B8">
<label>8</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yehia</surname> <given-names>BR</given-names>
</name>
<name>
<surname>Winegar</surname> <given-names>A</given-names>
</name>
<name>
<surname>Fogel</surname> <given-names>R</given-names>
</name>
<name>
<surname>Fakih</surname> <given-names>M</given-names>
</name>
<name>
<surname>Ottenbacher</surname> <given-names>A</given-names>
</name>
<name>
<surname>Jesser</surname> <given-names>C</given-names>
</name>
<etal/>
</person-group>. <article-title>Association of Race With Mortality Among Patients Hospitalized With Coronavirus Disease 2019 (Covid-19) at 92 US Hospitals</article-title>. <source>JAMA Network Open</source> (<year>2020</year>) <volume>3</volume>:<fpage>e2018039</fpage>. doi: <pub-id pub-id-type="doi">10.1001/jamanetworkopen.2020.18039</pub-id>
</citation>
</ref>
<ref id="B9">
<label>9</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>Q</given-names>
</name>
<name>
<surname>Bastard</surname> <given-names>P</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Le Pen</surname> <given-names>J</given-names>
</name>
<name>
<surname>Moncada-Velez</surname> <given-names>M</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>J</given-names>
</name>
<etal/>
</person-group>. <article-title>Inborn Errors of Type I IFN Immunity in Patients With Life-Threatening COVID-19</article-title>. <source>Science</source> (<year>2020</year>) <volume>370</volume>:<fpage>eabd4570</fpage>. doi: <pub-id pub-id-type="doi">10.1126/science.abd4570</pub-id>
</citation>
</ref>
<ref id="B10">
<label>10</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Grifoni</surname> <given-names>A</given-names>
</name>
<name>
<surname>Weiskopf</surname> <given-names>D</given-names>
</name>
<name>
<surname>Ramirez</surname> <given-names>SI</given-names>
</name>
<name>
<surname>Mateus</surname> <given-names>J</given-names>
</name>
<name>
<surname>Dan</surname> <given-names>JM</given-names>
</name>
<name>
<surname>Rydyznski Moderbacher</surname> <given-names>C</given-names>
</name>
<etal/>
</person-group>. <article-title>Targets of T Cell Responses to SARS-CoV-2 Coronavirus in Humans With COVID-19 Disease and Unexposed Individuals</article-title>. <source>Cell</source> (<year>2020</year>) <volume>181</volume>:<fpage>1489</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.cell.2020.05.015</pub-id>
</citation>
</ref>
<ref id="B11">
<label>11</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Staines</surname> <given-names>HM</given-names>
</name>
<name>
<surname>Kirwan</surname> <given-names>DE</given-names>
</name>
<name>
<surname>Clark</surname> <given-names>DJ</given-names>
</name>
<name>
<surname>Adams</surname> <given-names>ER</given-names>
</name>
<name>
<surname>Augustin</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Byrne</surname> <given-names>RL</given-names>
</name>
<etal/>
</person-group>. <article-title>Igg Seroconversion and Pathophysiology in Severe Acute Respiratory Syndrome Coronavirus 2 Infection</article-title>. <source>Emerging Infect Dis</source> (<year>2021</year>) <volume>27</volume>:<fpage>85</fpage>. doi: <pub-id pub-id-type="doi">10.3201/eid2701.203074</pub-id>
</citation>
</ref>
<ref id="B12">
<label>12</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mentzer</surname> <given-names>AJ</given-names>
</name>
<name>
<surname>O&#x2019;Connor</surname> <given-names>D</given-names>
</name>
<name>
<surname>Pollard</surname> <given-names>AJ</given-names>
</name>
<name>
<surname>Hill</surname> <given-names>AVS</given-names>
</name>
</person-group>. <article-title>Searching for the Human Genetic Factors Standing in the Way of Universally Effective Vaccines</article-title>. <source>Philos Trans R Soc Lond B Biol Sci</source> (<year>2015</year>) <volume>370</volume>:<fpage>20140341</fpage>. doi: <pub-id pub-id-type="doi">10.1098/rstb.2014.0341</pub-id>
</citation>
</ref>
<ref id="B13">
<label>13</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname> <given-names>G</given-names>
</name>
<name>
<surname>Carter</surname> <given-names>B</given-names>
</name>
<name>
<surname>Bricken</surname> <given-names>T</given-names>
</name>
<name>
<surname>Jain</surname> <given-names>S</given-names>
</name>
<name>
<surname>Viard</surname> <given-names>M</given-names>
</name>
<name>
<surname>Carrington</surname> <given-names>M</given-names>
</name>
<etal/>
</person-group>. <article-title>Computationally Optimized SARS-Cov-2 MHC Class I and II Vaccine Formulations Predicted to Target Human Haplotype Distributions</article-title>. <source>Cell Syst</source> (<year>2020</year>) <volume>11</volume>:<fpage>131</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.cels.2020.06.009</pub-id>
</citation>
</ref>
<ref id="B14">
<label>14</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Consortium</surname> <given-names>TU</given-names>
</name>
</person-group>. <article-title>UniProt: A Worldwide Hub of Protein Knowledge</article-title>. <source>Nucleic Acids Res</source> (<year>2018</year>) <volume>47</volume>:<fpage>D506</fpage>. doi: <pub-id pub-id-type="doi">10.1093/nar/gky1049</pub-id>
</citation>
</ref>
<ref id="B15">
<label>15</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gragert</surname> <given-names>L</given-names>
</name>
<name>
<surname>Madbouly</surname> <given-names>A</given-names>
</name>
<name>
<surname>Freeman</surname> <given-names>J</given-names>
</name>
<name>
<surname>Maiers</surname> <given-names>M</given-names>
</name>
</person-group>. <article-title>Six-Locus High Resolution HLA Haplotype Frequencies Derived From Mixed-Resolution DNA Typing for the Entire US Donor Registry</article-title>. <source>Hum Immunol</source> (<year>2013</year>) <volume>74</volume>:<fpage>1313</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.humimm.2013.06.025</pub-id>
</citation>
</ref>
<ref id="B16">
<label>16</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Reynisson</surname> <given-names>B</given-names>
</name>
<name>
<surname>Alvarez</surname> <given-names>B</given-names>
</name>
<name>
<surname>Paul</surname> <given-names>S</given-names>
</name>
<name>
<surname>Peters</surname> <given-names>B</given-names>
</name>
<name>
<surname>Nielsen</surname> <given-names>M</given-names>
</name>
<etal/>
</person-group>. <article-title>NetMHCpan-4.1 and NetMHCIIpan-4.0: Improved Predictions of MHC Antigen Presentation by Concurrent Motif Deconvolution and Integration of MS MHC Eluted Ligand Data</article-title>. <source>Nucleic Acids Res</source> (<year>2020</year>) <volume>48</volume>:<fpage>W449</fpage>. doi: <pub-id pub-id-type="doi">10.1093/nar/gkaa379</pub-id>
</citation>
</ref>
<ref id="B17">
<label>17</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pedregosa</surname> <given-names>F</given-names>
</name>
<name>
<surname>Varoquaux</surname> <given-names>G</given-names>
</name>
<name>
<surname>Gramfort</surname> <given-names>A</given-names>
</name>
<name>
<surname>Michel</surname> <given-names>V</given-names>
</name>
<name>
<surname>Thirion</surname> <given-names>B</given-names>
</name>
<name>
<surname>Grisel</surname> <given-names>O</given-names>
</name>
<etal/>
</person-group>. <article-title>Scikit-Learn: Machine Learning in Python</article-title>. <source>J Mach Learn Res</source> (<year>2011</year>) <volume>12</volume>:<fpage>2825</fpage>. doi: <pub-id pub-id-type="doi">10.5555/1953048.2078195</pub-id>
</citation>
</ref>
<ref id="B18">
<label>18</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>C</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>X</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>M</given-names>
</name>
<name>
<surname>He</surname> <given-names>T</given-names>
</name>
<etal/>
</person-group>. <article-title>The Establishment of Reference Sequence for SARS-CoV-2 and Variation Analysis</article-title>. <source>J Med Virol</source> (<year>2020</year>) <volume>92</volume>:<fpage>667</fpage>. doi: <pub-id pub-id-type="doi">10.1002/jmv.25762</pub-id>
</citation>
</ref>
<ref id="B19">
<label>19</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Reynisson</surname> <given-names>B</given-names>
</name>
<name>
<surname>Barra</surname> <given-names>C</given-names>
</name>
<name>
<surname>Kaabinejadian</surname> <given-names>S</given-names>
</name>
<name>
<surname>Hildebrand</surname> <given-names>WH</given-names>
</name>
<name>
<surname>Peters</surname> <given-names>B</given-names>
</name>
<name>
<surname>Nielsen</surname> <given-names>M</given-names>
</name>
<etal/>
</person-group>. <article-title>Improved Prediction of MHC II Antigen Presentation Through Integration and Motif Deconvolution of Mass Spectrometry MHC Eluted Ligand Data</article-title>. <source>J Proteome Res</source> (<year>2020</year>) <volume>19</volume>:<fpage>2304</fpage>. doi: <pub-id pub-id-type="doi">10.1021/acs.jproteome.9b00874</pub-id>
</citation>
</ref>
<ref id="B20">
<label>20</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Snyder</surname> <given-names>TM</given-names>
</name>
<name>
<surname>Gittelman</surname> <given-names>RM</given-names>
</name>
<name>
<surname>Klinger</surname> <given-names>M</given-names>
</name>
<name>
<surname>May</surname> <given-names>DH</given-names>
</name>
<name>
<surname>Osborne</surname> <given-names>EJ</given-names>
</name>
<name>
<surname>Taniguchi</surname> <given-names>R</given-names>
</name>
<etal/>
</person-group>. <article-title>Magnitude and Dynamics of the T-Cell Response to SARS-CoV-2 Infection at Both Individual and Population Levels</article-title>. <source>medRxiv Preprint Server Health Sci</source> (<year>2020</year>). doi: <pub-id pub-id-type="doi">10.1101/2020.07.31.20165647</pub-id>
</citation>
</ref>
<ref id="B21">
<label>21</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname> <given-names>G</given-names>
</name>
<name>
<surname>Carter</surname> <given-names>B</given-names>
</name>
<name>
<surname>Gifford</surname> <given-names>DK</given-names>
</name>
</person-group>. <article-title>Predicted Cellular Immunity Population Coverage Gaps for SARS-CoV-2 Subunit Vaccines and Their Augmentation by Compact Peptide Sets</article-title>. <source>Cell Syst</source> (<year>2021</year>) <page-range>102&#x2013;7</page-range>. doi: <pub-id pub-id-type="doi">10.1016/j.cels.2020.11.010</pub-id>
</citation>
</ref>
<ref id="B22">
<label>22</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nolan</surname> <given-names>S</given-names>
</name>
<name>
<surname>Vignali</surname> <given-names>M</given-names>
</name>
<name>
<surname>Klinger</surname> <given-names>M</given-names>
</name>
<name>
<surname>Dines</surname> <given-names>JN</given-names>
</name>
<name>
<surname>Kaplan</surname> <given-names>IM</given-names>
</name>
<name>
<surname>Svejnoha</surname> <given-names>E</given-names>
</name>
<etal/>
</person-group>. <article-title>A Large-Scale Database Of T-Cell Receptor Beta (Tcr&#x3b2;) Sequences And Binding Associations From Natural And Synthetic Exposure To Sars-Cov-2</article-title>. (<year>2020</year>). doi: <pub-id pub-id-type="doi">10.21203/rs.3.rs-51964/v1</pub-id>
</citation>
</ref>
<ref id="B23">
<label>23</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mateus</surname> <given-names>J</given-names>
</name>
<name>
<surname>Grifoni</surname> <given-names>A</given-names>
</name>
<name>
<surname>Tarke</surname> <given-names>A</given-names>
</name>
<name>
<surname>Sidney</surname> <given-names>J</given-names>
</name>
<name>
<surname>Ramirez</surname> <given-names>SI</given-names>
</name>
<name>
<surname>Dan</surname> <given-names>JM</given-names>
</name>
<etal/>
</person-group>. <article-title>Selective and Cross-Reactive SARS-Cov-2 T Cell Epitopes in Unexposed Humans</article-title>. <source>Science</source> (<year>2020</year>) <volume>370</volume>:<fpage>89</fpage>. doi: <pub-id pub-id-type="doi">10.1126/science.abd3871</pub-id>
</citation>
</ref>
<ref id="B24">
<label>24</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Le Bert</surname> <given-names>N</given-names>
</name>
<name>
<surname>Tan</surname> <given-names>AT</given-names>
</name>
<name>
<surname>Kunasegaran</surname> <given-names>K</given-names>
</name>
<name>
<surname>Tham</surname> <given-names>CYL</given-names>
</name>
<name>
<surname>Hafezi</surname> <given-names>M</given-names>
</name>
<name>
<surname>Chia</surname> <given-names>A</given-names>
</name>
<etal/>
</person-group>. <article-title>SARS-Cov-2-Specific T Cell Immunity in Cases of COVID-19 and SARS, and Uninfected Controls</article-title>. <source>Nature</source> (<year>2020</year>) <volume>584</volume>:<fpage>457</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41586-020-2550-z</pub-id>
</citation>
</ref>
<ref id="B25">
<label>25</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Keller</surname> <given-names>MD</given-names>
</name>
<name>
<surname>Harris</surname> <given-names>KM</given-names>
</name>
<name>
<surname>Jensen-Wachspress</surname> <given-names>MA</given-names>
</name>
<name>
<surname>Kankate</surname> <given-names>V</given-names>
</name>
<name>
<surname>Lang</surname> <given-names>H</given-names>
</name>
<name>
<surname>Lazarski</surname> <given-names>CA</given-names>
</name>
<etal/>
</person-group>. <article-title>SARS-Cov-2&#x2013;Specific T Cells Are Rapidly Expanded for Therapeutic Use and Target Conserved Regions of the Membrane Protein</article-title>. <source>Blood</source> (<year>2020</year>) <volume>136</volume>:<fpage>2905</fpage>. doi: <pub-id pub-id-type="doi">10.1182/blood.2020008488</pub-id>
</citation>
</ref>
<ref id="B26">
<label>26</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Prachar</surname> <given-names>M</given-names>
</name>
<name>
<surname>Justesen</surname> <given-names>S</given-names>
</name>
<name>
<surname>Steen-Jensen</surname> <given-names>DB</given-names>
</name>
<name>
<surname>Thorgrimsen</surname> <given-names>S</given-names>
</name>
<name>
<surname>Jurgons</surname> <given-names>E</given-names>
</name>
<name>
<surname>Winther</surname> <given-names>O</given-names>
</name>
<etal/>
</person-group>. <article-title>Identification and Validation of 174 COVID-19 Vaccine Candidate Epitopes Reveals Low Performance of Common Epitope Prediction Tools</article-title>. <source>Sci Rep</source> (<year>2020</year>) <volume>10</volume>:<fpage>20465</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41598-020-77466-4</pub-id>
</citation>
</ref>
<ref id="B27">
<label>27</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tarke</surname> <given-names>A</given-names>
</name>
<name>
<surname>Sidney</surname> <given-names>J</given-names>
</name>
<name>
<surname>Kidd</surname> <given-names>CK</given-names>
</name>
<name>
<surname>Dan</surname> <given-names>JM</given-names>
</name>
<name>
<surname>Ramirez</surname> <given-names>SI</given-names>
</name>
<name>
<surname>Yu</surname> <given-names>ED</given-names>
</name>
<etal/>
</person-group>. <article-title>Comprehensive Analysis of T Cell Immunodominance and Immunoprevalence of SARS-CoV-2 Epitopes in COVID-19 cases</article-title>. <source>Cell Rep Med</source> (<year>2021</year>) <volume>2</volume>(<issue>2</issue>):<fpage>100204</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.xcrm.2021.100204</pub-id>
</citation>
</ref>
<ref id="B28">
<label>28</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wajnberg</surname> <given-names>A</given-names>
</name>
<name>
<surname>Mansour</surname> <given-names>M</given-names>
</name>
<name>
<surname>Leven</surname> <given-names>E</given-names>
</name>
<name>
<surname>Bouvier</surname> <given-names>NM</given-names>
</name>
<name>
<surname>Patel</surname> <given-names>G</given-names>
</name>
<name>
<surname>Firpo-Betancourt</surname> <given-names>A</given-names>
</name>
<etal/>
</person-group>. <article-title>Humoral Response and PCR Positivity in Patients With COVID-19 in the New York City Region, USA: An Observational Study</article-title>. <source>Lancet Microbe</source> (<year>2020</year>) <volume>1</volume>:<fpage>e283</fpage>. doi: <pub-id pub-id-type="doi">10.1016/S2666-5247(20)30120-8</pub-id>
</citation>
</ref>
<ref id="B29">
<label>29</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rydyznski Moderbacher</surname> <given-names>C</given-names>
</name>
<name>
<surname>Ramirez</surname> <given-names>SI</given-names>
</name>
<name>
<surname>Dan</surname> <given-names>JM</given-names>
</name>
<name>
<surname>Grifoni</surname> <given-names>A</given-names>
</name>
<name>
<surname>Hastie</surname> <given-names>KM</given-names>
</name>
<name>
<surname>Weiskopf</surname> <given-names>D</given-names>
</name>
<etal/>
</person-group>. <article-title>Antigen-Specific Adaptive Immunity to SARS-CoV-2 in Acute Covid-19 and Associations With Age and Disease Severity</article-title>. <source>Cell</source> (<year>2020</year>) <volume>183</volume>:<fpage>996</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.cell.2020.09.038</pub-id>
</citation>
</ref>
<ref id="B30">
<label>30</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Juno</surname> <given-names>JA</given-names>
</name>
<name>
<surname>Tan</surname> <given-names>H-X</given-names>
</name>
<name>
<surname>Lee</surname> <given-names>WS</given-names>
</name>
<name>
<surname>Reynaldi</surname> <given-names>A</given-names>
</name>
<name>
<surname>Kelly</surname> <given-names>HG</given-names>
</name>
<name>
<surname>Wragg</surname> <given-names>K</given-names>
</name>
<etal/>
</person-group>. <article-title>Humoral and Circulating Follicular Helper T Cell Responses in Recovered Patients With COVID-19</article-title>. <source>Nat Med</source> (<year>2020</year>) <volume>26</volume>:<fpage>1428</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41591-020-0995-0</pub-id>
</citation>
</ref>
<ref id="B31">
<label>31</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Iyer</surname> <given-names>AS</given-names>
</name>
<name>
<surname>Jones</surname> <given-names>FK</given-names>
</name>
<name>
<surname>Nodoushani</surname> <given-names>A</given-names>
</name>
<name>
<surname>Kelly</surname> <given-names>M</given-names>
</name>
<name>
<surname>Becker</surname> <given-names>M</given-names>
</name>
<name>
<surname>Slater</surname> <given-names>D</given-names>
</name>
<etal/>
</person-group>. <article-title>Persistence and Decay of Human Antibody Responses to the Receptor Binding Domain of SARS-CoV-2 Spike Protein in COVID-19 Patients</article-title>. <source>Sci Immunol</source> (<year>2020</year>) <volume>5</volume>:<fpage>eabe0367</fpage>. doi: <pub-id pub-id-type="doi">10.1126/sciimmunol.abe0367</pub-id>
</citation>
</ref>
<ref id="B32">
<label>32</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Poll&#xe1;n</surname> <given-names>M</given-names>
</name>
<name>
<surname>P&#xe9;rez-G&#xf3;mez</surname> <given-names>B</given-names>
</name>
<name>
<surname>Pastor-Barriuso</surname> <given-names>R</given-names>
</name>
<name>
<surname>Oteo</surname> <given-names>J</given-names>
</name>
<name>
<surname>P&#xe9;rez-Olmeda</surname> <given-names>M</given-names>
</name>
<name>
<surname>Yotti</surname> <given-names>R</given-names>
</name>
<etal/>
</person-group>. <article-title>Prevalence of SARS-CoV-2 in Spain (Ene-COVID): A Nationwide, Population-Based Seroepidemiological Study</article-title>. <source>Lancet</source> (<year>2020</year>) <volume>396</volume>:<fpage>535</fpage>. doi: <pub-id pub-id-type="doi">10.1016/S0140-6736(20)32266-2</pub-id>
</citation>
</ref>
<ref id="B33">
<label>33</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dan</surname> <given-names>JM</given-names>
</name>
<name>
<surname>Mateus</surname> <given-names>J</given-names>
</name>
<name>
<surname>Kato</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Hastie</surname> <given-names>KM</given-names>
</name>
<name>
<surname>Dawen</surname> <given-names>E</given-names>
</name>
<name>
<surname>Faliti</surname> <given-names>CE</given-names>
</name>
<etal/>
</person-group>. <article-title>Immunological Memory to SARS-CoV-2 Assessed for Up to 8 Months After Infection</article-title>. <source>Science</source> (<year>2021</year>) <volume>371</volume>:<fpage>eabf4063</fpage>. doi: <pub-id pub-id-type="doi">10.1126/science.abf4063</pub-id>
</citation>
</ref>
<ref id="B34">
<label>34</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yu</surname> <given-names>J</given-names>
</name>
<name>
<surname>Tostanoski</surname> <given-names>LH</given-names>
</name>
<name>
<surname>Peter</surname> <given-names>L</given-names>
</name>
<name>
<surname>Mercado</surname> <given-names>NB</given-names>
</name>
<name>
<surname>McMahan</surname> <given-names>K</given-names>
</name>
<name>
<surname>Mahrokhian</surname> <given-names>SH</given-names>
</name>
<etal/>
</person-group>. <article-title>DNA Vaccine Protection Against SARS-CoV-2 in Rhesus Macaques</article-title>. <source>Science</source> (<year>2020</year>) <volume>369</volume>:<fpage>806</fpage>. doi: <pub-id pub-id-type="doi">10.1126/science.abc6284</pub-id>
</citation>
</ref>
<ref id="B35">
<label>35</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dai</surname> <given-names>L</given-names>
</name>
<name>
<surname>Zheng</surname> <given-names>T</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>K</given-names>
</name>
<name>
<surname>Han</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>L</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>E</given-names>
</name>
<etal/>
</person-group>. <article-title>A Universal Design of Betacoronavirus Vaccines against COVID-19, MERS, and SARS</article-title>. <source>Cell</source> (<year>2020</year>) <volume>182</volume>:<fpage>722</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.cell.2020.06.035</pub-id>
</citation>
</ref>
<ref id="B36">
<label>36</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dong</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Dai</surname> <given-names>T</given-names>
</name>
<name>
<surname>Wei</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>L</given-names>
</name>
<name>
<surname>Zheng</surname> <given-names>M</given-names>
</name>
<name>
<surname>Zhou</surname> <given-names>F</given-names>
</name>
<etal/>
</person-group>. <article-title>A Systematic Review of SARS-CoV-2 Vaccine Candidates</article-title>. <source>Signal Transduction Targeted Ther</source> (<year>2020</year>) <volume>5</volume>:<fpage>237</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41392-020-00352-y</pub-id>
</citation>
</ref>
<ref id="B37">
<label>37</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Vabret</surname> <given-names>N</given-names>
</name>
<name>
<surname>Britton</surname> <given-names>GJ</given-names>
</name>
<name>
<surname>Gruber</surname> <given-names>C</given-names>
</name>
<name>
<surname>Hegde</surname> <given-names>S</given-names>
</name>
<name>
<surname>Kim</surname> <given-names>J</given-names>
</name>
<name>
<surname>Kuksin</surname> <given-names>M</given-names>
</name>
<etal/>
</person-group>. <article-title>Immunology of COVID-19: Current State of The Science</article-title>. <source>Immunity</source> (<year>2020</year>) <volume>52</volume>:<fpage>910</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.immuni.2020.05.002</pub-id>
</citation>
</ref>
<ref id="B38">
<label>38</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Peng</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Mentzer</surname> <given-names>AJ</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>G</given-names>
</name>
<name>
<surname>Yao</surname> <given-names>X</given-names>
</name>
<name>
<surname>Yin</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Dong</surname> <given-names>D</given-names>
</name>
<etal/>
</person-group>. <article-title>Broad and Strong Memory CD4+ and CD8+ T Cells Induced by SARS-CoV-2 in UK Convalescent Individuals Following COVID-19</article-title>. <source>Nat Immunol</source> (<year>2020</year>) <volume>21</volume>:<fpage>1336</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41590-020-0782-6</pub-id>
</citation>
</ref>
<ref id="B39">
<label>39</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sekine</surname> <given-names>T</given-names>
</name>
<name>
<surname>Perez-Potti</surname> <given-names>A</given-names>
</name>
<name>
<surname>Rivera-Ballesteros</surname> <given-names>O</given-names>
</name>
<name>
<surname>Str&#xe5;lin</surname> <given-names>K</given-names>
</name>
<name>
<surname>Gorin</surname> <given-names>JB</given-names>
</name>
<name>
<surname>Olsson</surname> <given-names>A</given-names>
</name>
<etal/>
</person-group>. <article-title>Robust T Cell Immunity in Convalescent Individuals With Asymptomatic or Mild Covid-19</article-title>. <source>Cell</source> (<year>2020</year>) <volume>183</volume>:<fpage>158</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.cell.2020.08.017</pub-id>
</citation>
</ref>
<ref id="B40">
<label>40</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Huang</surname> <given-names>M</given-names>
</name>
<name>
<surname>Lu</surname> <given-names>QB</given-names>
</name>
<name>
<surname>Zhao</surname> <given-names>H</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Sui</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Fang</surname> <given-names>L</given-names>
</name>
<etal/>
</person-group>. <article-title>Temporal Antibody Responses to SARS-CoV-2 in Patients of Coronavirus Disease 2019</article-title>. <source>Cell Discovery</source> (<year>2020</year>) <volume>6</volume>:<fpage>64</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41421-020-00209-2</pub-id>
</citation>
</ref>
<ref id="B41">
<label>41</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Corbett</surname> <given-names>KS</given-names>
</name>
<name>
<surname>Flynn</surname> <given-names>B</given-names>
</name>
<name>
<surname>Foulds</surname> <given-names>KE</given-names>
</name>
<name>
<surname>Francica</surname> <given-names>JR</given-names>
</name>
<name>
<surname>Boyoglu-Barnum</surname> <given-names>S</given-names>
</name>
<name>
<surname>Werner</surname> <given-names>AP</given-names>
</name>
<etal/>
</person-group>. <article-title>Evaluation of the mRNA-1273 Vaccine Against SARS-CoV-2 in Nonhuman Primates</article-title>. <source>New Engl J Med</source> (<year>2020</year>) <volume>383</volume>:<fpage>1544</fpage>. doi: <pub-id pub-id-type="doi">10.1056/NEJMoa2024671</pub-id>
</citation>
</ref>
<ref id="B42">
<label>42</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dan</surname> <given-names>JM</given-names>
</name>
<name>
<surname>Mateus</surname> <given-names>J</given-names>
</name>
<name>
<surname>Kato</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Hastie</surname> <given-names>KM</given-names>
</name>
<name>
<surname>Faliti</surname> <given-names>CE</given-names>
</name>
<name>
<surname>Ramirez</surname> <given-names>SI</given-names>
</name>
<etal/>
</person-group>. <article-title>Immunological Memory to SARS-CoV-2 Assessed for Greater Than Six Months After Infection</article-title>. <source>bioRxiv</source> (<year>2020</year>). doi: <pub-id pub-id-type="doi">10.1101/2020.11.15.383323</pub-id>
</citation>
</ref>
<ref id="B43">
<label>43</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nelde</surname> <given-names>A</given-names>
</name>
<name>
<surname>Bilich</surname> <given-names>T</given-names>
</name>
<name>
<surname>Heitmann</surname> <given-names>JS</given-names>
</name>
<name>
<surname>Maringer</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Salih</surname> <given-names>HR</given-names>
</name>
<name>
<surname>Roerden</surname> <given-names>M</given-names>
</name>
<etal/>
</person-group>. <article-title>Sars-CoV-2-derived Peptides Define Heterologous and COVID-19-Induced T Cell Recognition</article-title>. <source>Nat Immunol</source> (<year>2021</year>) <volume>22</volume>:<fpage>74</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41590-020-00808-x</pub-id>
</citation>
</ref>
<ref id="B44">
<label>44</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Goldrath</surname> <given-names>AW</given-names>
</name>
<name>
<surname>Bevan</surname> <given-names>MJ</given-names>
</name>
</person-group>. <article-title>Selecting and Maintaining a Diverse T-Cell Repertoire</article-title>. <source>Nature</source> (<year>1999</year>) <volume>402</volume>:<fpage>255</fpage>. doi: <pub-id pub-id-type="doi">10.1038/46218</pub-id>
</citation>
</ref>
<ref id="B45">
<label>45</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Messaoudi</surname> <given-names>I</given-names>
</name>
<name>
<surname>Guevara Pati&#xf1;o</surname> <given-names>JA</given-names>
</name>
<name>
<surname>Dyall</surname> <given-names>R</given-names>
</name>
<name>
<surname>LeMaoult</surname> <given-names>J</given-names>
</name>
<name>
<surname>Nikolich-&#x17d;ugich</surname> <given-names>J</given-names>
</name>
<etal/>
</person-group>. <article-title>Direct Link Between Mhc Polymorphism, T Cell Avidity, and Diversity in Immune Defense</article-title>. <source>Science</source> (<year>2002</year>) <volume>298</volume>:<fpage>1797</fpage>. doi: <pub-id pub-id-type="doi">10.1126/science.1076064</pub-id>
</citation>
</ref>
<ref id="B46">
<label>46</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lassale</surname> <given-names>C</given-names>
</name>
<name>
<surname>Gaye</surname> <given-names>B</given-names>
</name>
<name>
<surname>Hamer</surname> <given-names>M</given-names>
</name>
<name>
<surname>Gale</surname> <given-names>CR</given-names>
</name>
<name>
<surname>Batty</surname> <given-names>GD</given-names>
</name>
<etal/>
</person-group>. <article-title>Ethnic Disparities in Hospitalisation for COVID-19 in England: The Role of Socioeconomic Factors, Mental Health, and Inflammatory and Pro-Inflammatory Factors in a Community-Based Cohort Study</article-title>. <source>Brain behav Immun</source> (<year>2020</year>) <volume>88</volume>:<fpage>44</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.bbi.2020.05.074</pub-id>
</citation>
</ref>
<ref id="B47">
<label>47</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Aldridge</surname> <given-names>RW</given-names>
</name>
<name>
<surname>Lewer</surname> <given-names>D</given-names>
</name>
<name>
<surname>Katikireddi</surname> <given-names>SV</given-names>
</name>
<name>
<surname>Mathur</surname> <given-names>R</given-names>
</name>
<name>
<surname>Pathak</surname> <given-names>N</given-names>
</name>
<name>
<surname>Burns</surname> <given-names>R</given-names>
</name>
<etal/>
</person-group>. <article-title>Black, Asian and Minority Ethnic Groups in England are at Increased Risk of Death From COVID-19: Indirect Standardisation of NHS Mortality Data</article-title>. <source>Wellcome Open Res</source> (<year>2020</year>) <volume>5</volume>:<fpage>88</fpage>. doi: <pub-id pub-id-type="doi">10.12688/wellcomeopenres.15922.1</pub-id>
</citation>
</ref>
<ref id="B48">
<label>48</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Guo</surname> <given-names>X</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Li</surname> <given-names>J</given-names>
</name>
<name>
<surname>Ma</surname> <given-names>J</given-names>
</name>
<name>
<surname>Wei</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Tan</surname> <given-names>W</given-names>
</name>
<etal/>
</person-group>. <article-title>Strong Influence of Human Leukocyte Antigen (HLA)-DP Gene Variants on Development of Persistent Chronic Hepatitis B Virus Carriers in the Han Chinese Population</article-title>. <source>Hepatology</source> (<year>2011</year>) <volume>53</volume>:<fpage>422</fpage>. doi: <pub-id pub-id-type="doi">10.1002/hep.24048</pub-id>
</citation>
</ref>
<ref id="B49">
<label>49</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Blackwell</surname> <given-names>JM</given-names>
</name>
<name>
<surname>Jamieson</surname> <given-names>SE</given-names>
</name>
<name>
<surname>Burgner</surname> <given-names>D</given-names>
</name>
</person-group>. <article-title>HLA and Infectious Diseases</article-title>. <source>Clin Microbiol Rev</source> (<year>2009</year>) <volume>22</volume>:<fpage>370</fpage>. doi: <pub-id pub-id-type="doi">10.1128/CMR.00048-08</pub-id>
</citation>
</ref>
<ref id="B50">
<label>50</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pisanti</surname> <given-names>S</given-names>
</name>
<name>
<surname>Deelen</surname> <given-names>J</given-names>
</name>
<name>
<surname>Gallina</surname> <given-names>AM</given-names>
</name>
<name>
<surname>Caputo</surname> <given-names>M</given-names>
</name>
<name>
<surname>Citro</surname> <given-names>M</given-names>
</name>
<name>
<surname>Abate</surname> <given-names>M</given-names>
</name>
<etal/>
</person-group>. <article-title>Correlation of the Two Most Frequent HLA Haplotypes in the Italian Population to the Differential Regional Incidence of Covid-19</article-title>. <source>J Trans Med</source> (<year>2020</year>) <volume>18</volume>:<fpage>352</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s12967-020-02515-5</pub-id>
</citation>
</ref>
<ref id="B51">
<label>51</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Langton</surname> <given-names>DJ</given-names>
</name>
<name>
<surname>Bourke</surname> <given-names>SC</given-names>
</name>
<name>
<surname>Lie</surname> <given-names>BA</given-names>
</name>
<name>
<surname>Reiff</surname> <given-names>G</given-names>
</name>
<name>
<surname>Natu</surname> <given-names>S</given-names>
</name>
<name>
<surname>Darlay</surname> <given-names>R</given-names>
</name>
<etal/>
</person-group>. <article-title>The Influence Of Hla Genotype On Susceptibility To, And Severity Of, Covid-19 Infection</article-title>. <source>medRxiv</source> (<year>2021</year>). doi: <pub-id pub-id-type="doi">10.1101/2020.12.31.20249081</pub-id>
</citation>
</ref>
<ref id="B52">
<label>52</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wiedermann</surname> <given-names>U</given-names>
</name>
<name>
<surname>Garner-Spitzer</surname> <given-names>E</given-names>
</name>
<name>
<surname>Wagner</surname> <given-names>A</given-names>
</name>
</person-group>. <article-title>Primary Vaccine Failure to Routine Vaccines: Why and What to do</article-title>? <source>Hum Vaccines Immunotherapeutics</source> (<year>2016</year>) <volume>12</volume>:<fpage>239</fpage>. doi: <pub-id pub-id-type="doi">10.1080/21645515.2015.1093263</pub-id>
</citation>
</ref>
<ref id="B53">
<label>53</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kimman</surname> <given-names>TG</given-names>
</name>
<name>
<surname>Vandebriel</surname> <given-names>RJ</given-names>
</name>
<name>
<surname>Hoebee</surname> <given-names>B</given-names>
</name>
</person-group>. <article-title>Genetic Variation in the Response to Vaccination</article-title>. <source>Community Genet</source> (<year>2007</year>) <volume>10</volume>:<fpage>201</fpage>. doi: <pub-id pub-id-type="doi">10.1159/000106559</pub-id>
</citation>
</ref>
<ref id="B54">
<label>54</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gelder</surname> <given-names>CM</given-names>
</name>
<name>
<surname>Lambkin</surname> <given-names>R</given-names>
</name>
<name>
<surname>Hart</surname> <given-names>KW</given-names>
</name>
<name>
<surname>Fleming</surname> <given-names>D</given-names>
</name>
<name>
<surname>Williams</surname> <given-names>OM</given-names>
</name>
<name>
<surname>Bunce</surname> <given-names>M</given-names>
</name>
<etal/>
</person-group>. <article-title>Associations Between Human Leukocyte Antigens and Nonresponsiveness to Influenza Vaccine</article-title>. <source>J Infect Dis</source> (<year>2002</year>) <volume>185</volume>:<fpage>114</fpage>. doi: <pub-id pub-id-type="doi">10.1086/338014</pub-id>
</citation>
</ref>
<ref id="B55">
<label>55</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Godkin</surname> <given-names>A</given-names>
</name>
<name>
<surname>Davenport</surname> <given-names>M</given-names>
</name>
<name>
<surname>Hill</surname> <given-names>AV</given-names>
</name>
</person-group>. <article-title>Molecular Analysis of HLA Class II Associations With Hepatitis B Virus Clearance and Vaccine Nonresponsiveness</article-title>. <source>Hepatology</source> (<year>2005</year>) <volume>41</volume>:<fpage>1383</fpage>. doi: <pub-id pub-id-type="doi">10.1002/hep.20716</pub-id>
</citation>
</ref>
<ref id="B56">
<label>56</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gregoriadis</surname> <given-names>G</given-names>
</name>
</person-group>. <article-title>Liposomes In Therapeutic And Preventive Medicine: The Development Of The Drug-Carrier Concept</article-title>. <source>Ann NY Acad Sci</source> (<year>1978</year>) <volume>308</volume>:<fpage>343</fpage>. doi: <pub-id pub-id-type="doi">10.1111/j.1749-6632.1978.tb22034.x</pub-id>
</citation>
</ref>
<ref id="B57">
<label>57</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Anderson</surname> <given-names>EJ</given-names>
</name>
<name>
<surname>Rouphael</surname> <given-names>NG</given-names>
</name>
<name>
<surname>Widge</surname> <given-names>AT</given-names>
</name>
<name>
<surname>Jackson</surname> <given-names>LA</given-names>
</name>
<name>
<surname>Roberts</surname> <given-names>PC</given-names>
</name>
<name>
<surname>Makhene</surname> <given-names>M</given-names>
</name>
<etal/>
</person-group>. <article-title>Safety and Immunogenicity of SARS-CoV-2 mRNA-1273 Vaccine in Older Adults</article-title>. <source>N Engl J Med</source> (<year>2020</year>) <volume>383</volume>:<fpage>2427</fpage>. doi: <pub-id pub-id-type="doi">10.1056/NEJMoa2028436</pub-id>
</citation>
</ref>
<ref id="B58">
<label>58</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Walsh</surname> <given-names>EE</given-names>
</name>
<name>
<surname>Frenck</surname> <given-names>RW</given-names>
<suffix>Jr.</suffix>
</name>
<name>
<surname>Falsey</surname> <given-names>AR</given-names>
</name>
<name>
<surname>Kitchin</surname> <given-names>N</given-names>
</name>
<name>
<surname>Absalon</surname> <given-names>J</given-names>
</name>
<name>
<surname>Gurtman</surname> <given-names>A</given-names>
</name>
<etal/>
</person-group>. <article-title>Safety and Immunogenicity of Two Rna-Based Covid-19 Vaccine Candidates</article-title>. <source>N Engl J Med</source> (<year>2020</year>) <volume>383</volume>:<fpage>2439</fpage>. doi: <pub-id pub-id-type="doi">10.1056/NEJMoa2027906</pub-id>
</citation>
</ref>
<ref id="B59">
<label>59</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhu</surname> <given-names>F-C</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Y-H</given-names>
</name>
<name>
<surname>Guan</surname> <given-names>X-H</given-names>
</name>
<name>
<surname>Hou</surname> <given-names>LH</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>WJ</given-names>
</name>
<name>
<surname>Li</surname> <given-names>JX</given-names>
</name>
<etal/>
</person-group>. <article-title>Safety, Tolerability, and Immunogenicity of a Recombinant Adenovirus Type-5 Vectored COVID-19 Vaccine: A Dose-Escalation, Open-Label, Non-Randomised, First-in-Human Trial</article-title>. <source>Lancet</source> (<year>2020</year>) <volume>395</volume>:<fpage>1845</fpage>. doi: <pub-id pub-id-type="doi">10.1016/S0140-6736(20)31208-3</pub-id>
</citation>
</ref>
<ref id="B60">
<label>60</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ramasamy</surname> <given-names>MN</given-names>
</name>
<name>
<surname>Minassian</surname> <given-names>AM</given-names>
</name>
<name>
<surname>Ewer</surname> <given-names>KJ</given-names>
</name>
<name>
<surname>Flaxman</surname> <given-names>AL</given-names>
</name>
<name>
<surname>Folegatti</surname> <given-names>PM</given-names>
</name>
<name>
<surname>Owens</surname> <given-names>DR</given-names>
</name>
<etal/>
</person-group>. <article-title>Safety and Immunogenicity of ChAdOx1 nCoV-19 Vaccine Administered in a Prime-Boost Regimen in Young and Old Adults (COV002): A Single-Blind, Randomised, Controlled, Phase 2/3 Trial</article-title>. <source>Lancet</source> (<year>2021</year>) <volume>396</volume>:<fpage>1979</fpage>. doi: <pub-id pub-id-type="doi">10.1016/S0140-6736(20)32466-1</pub-id>
</citation>
</ref>
<ref id="B61">
<label>61</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Logunov</surname> <given-names>DY</given-names>
</name>
<name>
<surname>Dolzhikova</surname> <given-names>IV</given-names>
</name>
<name>
<surname>Zubkova</surname> <given-names>OV</given-names>
</name>
<name>
<surname>Tukhvatulin</surname> <given-names>AI</given-names>
</name>
<name>
<surname>Shcheblyakov</surname> <given-names>DV</given-names>
</name>
<name>
<surname>Dzharullaeva</surname> <given-names>AS</given-names>
</name>
<etal/>
</person-group>. <article-title>Safety and Immunogenicity of an rAd26 and rAd5 Vector-Based Heterologous Prime-Boost COVID-19 Vaccine in Two Formulations: Two Open, non-Randomised Phase 1/2 Studies From Russia</article-title>. <source>Lancet</source> (<year>2020</year>) <volume>396</volume>:<fpage>887</fpage>. doi: <pub-id pub-id-type="doi">10.1016/S0140-6736(20)31866-3</pub-id>
</citation>
</ref>
<ref id="B62">
<label>62</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhu</surname> <given-names>F-C</given-names>
</name>
<name>
<surname>Guan</surname> <given-names>X-H</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Y-H</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>JY</given-names>
</name>
<name>
<surname>Jiang</surname> <given-names>T</given-names>
</name>
<name>
<surname>Hou</surname> <given-names>LH</given-names>
</name>
<etal/>
</person-group>. <article-title>Immunogenicity and Safety of a Recombinant Adenovirus Type-5-Vectored COVID-19 Vaccine in Healthy Adults Aged 18 Years or Older: A Randomised, Double-Blind, Placebo-Controlled, Phase 2 Trial</article-title>. <source>Lancet</source> (<year>2020</year>) <volume>396</volume>:<fpage>479</fpage>. doi: <pub-id pub-id-type="doi">10.1016/S0140-6736(20)31605-6</pub-id>
</citation>
</ref>
<ref id="B63">
<label>63</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Roche</surname> <given-names>PA</given-names>
</name>
<name>
<surname>Furuta</surname> <given-names>K</given-names>
</name>
</person-group>. <article-title>The Ins and Outs of MHC Class II-Mediated Antigen Processing and Presentation</article-title>. <source>Nat Rev Immunol</source> (<year>2015</year>) <volume>15</volume>:<fpage>203</fpage>. doi: <pub-id pub-id-type="doi">10.1038/nri3818</pub-id>
</citation>
</ref>
<ref id="B64">
<label>64</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yarmarkovich</surname> <given-names>M</given-names>
</name>
<name>
<surname>Warrington</surname> <given-names>JM</given-names>
</name>
<name>
<surname>Farrel</surname> <given-names>A</given-names>
</name>
<name>
<surname>Maris</surname> <given-names>JM</given-names>
</name>
</person-group>. <article-title>Identification of SARS-CoV-2 Vaccine Epitopes Predicted to Induce Long-Term Population-Scale Immunity</article-title>. <source>Cell Rep Med</source> (<year>2020</year>) <volume>1</volume>(<issue>3</issue>):<fpage>100036</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.xcrm.2020.100036</pub-id>
</citation>
</ref>
<ref id="B65">
<label>65</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Behmard</surname> <given-names>E</given-names>
</name>
<name>
<surname>Soleymani</surname> <given-names>B</given-names>
</name>
<name>
<surname>Najafi</surname> <given-names>A</given-names>
</name>
<name>
<surname>Barzegari</surname> <given-names>E</given-names>
</name>
</person-group>. <article-title>Immunoinformatic Design of a COVID-19 Subunit Vaccine Using Entire Structural Immunogenic Epitopes of SARS-Cov-2</article-title>. <source>Sci Rep</source> (<year>2020</year>) <volume>10</volume>:<fpage>20864</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41598-020-77547-4</pub-id>
</citation>
</ref>
<ref id="B66">
<label>66</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gragert</surname> <given-names>L</given-names>
</name>
<name>
<surname>Eapen</surname> <given-names>M</given-names>
</name>
<name>
<surname>Williams</surname> <given-names>E</given-names>
</name>
<name>
<surname>Freeman</surname> <given-names>J</given-names>
</name>
<name>
<surname>Spellman</surname> <given-names>S</given-names>
</name>
<name>
<surname>Baitty</surname> <given-names>R</given-names>
</name>
<etal/>
</person-group>. <article-title>HLA Match Likelihoods for Hematopoietic Stem-Cell Grafts in the U.S. Registry</article-title>. <source> N Engl J Med</source> (<year>2014</year>) <volume>371</volume>:<fpage>339</fpage>. doi: <pub-id pub-id-type="doi">10.1056/NEJMsa1311707</pub-id>
</citation>
</ref>
<ref id="B67">
<label>67</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Simanovsky</surname> <given-names>AL</given-names>
</name>
<name>
<surname>Madbouly</surname> <given-names>A</given-names>
</name>
<name>
<surname>Halagan</surname> <given-names>M</given-names>
</name>
<name>
<surname>Maiers</surname> <given-names>M</given-names>
</name>
<name>
<surname>Louzoun</surname> <given-names>Y</given-names>
</name>
<etal/>
</person-group>. <article-title>Single Haplotype Admixture Models Using Large Scale HLA Genotype Frequencies to Reproduce Human Admixture</article-title>. <source>Immunogenetics</source> (<year>2019</year>) <volume>71</volume>:<fpage>589</fpage>. doi: <pub-id pub-id-type="doi">10.1007/s00251-019-01144-7</pub-id>
</citation>
</ref>
<ref id="B68">
<label>68</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Madbouly</surname> <given-names>A</given-names>
</name>
<name>
<surname>Gragert</surname> <given-names>L</given-names>
</name>
<name>
<surname>Freeman</surname> <given-names>J</given-names>
</name>
<name>
<surname>Leahy</surname> <given-names>N</given-names>
</name>
<name>
<surname>Gourraud</surname> <given-names>PA</given-names>
</name>
<name>
<surname>Hollenbach</surname> <given-names>JA</given-names>
</name>
<etal/>
</person-group>. <article-title>Validation of Statistical Imputation of Allele-Level Multilocus Phased Genotypes From Ambiguous HLA Assignments</article-title>. <source>Tissue Antigens</source> (<year>2014</year>) <volume>84</volume>:<fpage>285</fpage>. doi: <pub-id pub-id-type="doi">10.1111/tan.12390</pub-id>
</citation>
</ref>
<ref id="B69">
<label>69</label>
<citation citation-type="web">Available at: <uri xlink:href="https://data.mendeley.com/datasets/545r9cggzf/1">https://data.mendeley.com/datasets/545r9cggzf/1</uri>.</citation>
</ref>
<ref id="B70">
<label>70</label>
<citation citation-type="web">Available at: <uri xlink:href="https://data.mendeley.com/datasets/bjbw35cg35/1">https://data.mendeley.com/datasets/bjbw35cg35/1</uri>.</citation>
</ref>
</ref-list>
</back>
</article>