<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Immunol.</journal-id>
<journal-title>Frontiers in Immunology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Immunol.</abbrev-journal-title>
<issn pub-type="epub">1664-3224</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fimmu.2024.1359169</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Immunology</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Unraveling the chicken T cell repertoire with enhanced genome annotation</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Fr&#xfc;h</surname>
<given-names>Simon P.</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2607154"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Fr&#xfc;h</surname>
<given-names>Martin A.</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Kaufer</surname>
<given-names>Benedikt B.</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/257760"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>G&#xf6;bel</surname>
<given-names>Thomas W.</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/521843"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Department of Veterinary Sciences, Ludwig-Maximilians-Universit&#xe4;t M&#xfc;nchen</institution>, <addr-line>Munich</addr-line>, <country>Germany</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Institute of Virology, Freie Universit&#xe4;t Berlin</institution>, <addr-line>Berlin</addr-line>, <country>Germany</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Independent Researcher</institution>, <addr-line>Munich</addr-line>, <country>Germany</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>Edited by: Michal Vinkler, Charles University, Czechia</p>
</fn>
<fn fn-type="edited-by">
<p>Reviewed by: Guan-Jun Yang, Ningbo University, China</p>
<p>Magdalena Migalska, Jagiellonian University, Poland</p>
</fn>
<fn fn-type="corresp" id="fn001">
<p>*Correspondence: Thomas W. G&#xf6;bel, <email xlink:href="mailto:goebel@lmu.de">goebel@lmu.de</email>; Simon P. Fr&#xfc;h, <email xlink:href="mailto:s.frueh@lmu.de">s.frueh@lmu.de</email>
</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>14</day>
<month>03</month>
<year>2024</year>
</pub-date>
<pub-date pub-type="collection">
<year>2024</year>
</pub-date>
<volume>15</volume>
<elocation-id>1359169</elocation-id>
<history>
<date date-type="received">
<day>20</day>
<month>12</month>
<year>2023</year>
</date>
<date date-type="accepted">
<day>23</day>
<month>02</month>
<year>2024</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2024 Fr&#xfc;h, Fr&#xfc;h, Kaufer and G&#xf6;bel</copyright-statement>
<copyright-year>2024</copyright-year>
<copyright-holder>Fr&#xfc;h, Fr&#xfc;h, Kaufer and G&#xf6;bel</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>T cell receptor (TCR) repertoire sequencing has emerged as a powerful tool for understanding the diversity and functionality of T cells within the host immune system. Yet, the chicken TCR repertoire remains poorly understood due to incomplete genome annotation of the TCR loci, despite the importance of chickens in agriculture and as an immunological model. Here, we addressed this critical issue by employing 5&#x2019; rapid amplification of complementary DNA ends (5&#x2019;RACE) TCR repertoire sequencing with molecular barcoding of complementary DNA (cDNA) molecules. Simultaneously, we enhanced the genome annotation of TCR Variable (V), Diversity (D, only present in &#x3b2; and &#x3b4; loci) and Joining (J) genes in the chicken genome. To enhance the efficiency of TCR annotations, we developed <italic>VJ-gene-finder</italic>, an algorithm designed to extract VJ gene candidates from deoxyribonucleic acid (DNA) sequences. Using this tool, we achieved a comprehensive annotation of all known chicken TCR loci, including the &#x3b1;/&#x3b4; locus on chromosome 27. Evolutionary analysis revealed that each locus evolved separately by duplication of long homology units. To define the baseline TCR diversity in healthy chickens and to demonstrate the feasibility of the approach, we characterized the splenic &#x3b1;/&#x3b2;/&#x3b3;/&#x3b4; TCR repertoire. Analysis of the repertoires revealed preferential usage of specific V and J combinations in all chains, while the overall features were characteristic of unbiased repertoires. We observed moderate levels of shared complementarity-determining region 3 (CDR3) clonotypes among individual birds within the &#x3b1; and &#x3b3; chain repertoires, including the most frequently occurring clonotypes. However, the &#x3b2; and &#x3b4; repertoires were predominantly unique to each bird. Taken together, our TCR repertoire analysis allowed us to decipher the composition, diversity, and functionality of T cells in chickens. 
This work not only represents a significant step towards understanding avian T cell biology, but will also shed light on host-pathogen interactions, vaccine development, and the evolutionary history of avian immunology.</p>
</abstract>
<kwd-group>
<kwd>chicken</kwd>
<kwd>T cells</kwd>
<kwd>TCR &#x3b1;/&#x3b2;/&#x3b3;/&#x3b4; locus annotation</kwd>
<kwd>
<italic>VJ-gene-finder</italic>
</kwd>
<kwd>TCR repertoire sequencing</kwd>
<kwd>spleen</kwd>
</kwd-group>
<counts>
<fig-count count="9"/>
<table-count count="1"/>
<equation-count count="0"/>
<ref-count count="80"/>
<page-count count="19"/>
<word-count count="10754"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-in-acceptance</meta-name>
<meta-value>Comparative Immunology</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<label>1</label>
<title>Introduction</title>
<p>The avian immune system plays a pivotal role in safeguarding poultry health, thereby contributing significantly to human food security. Among the various components of the avian immune system, T cells are instrumental in orchestrating adaptive immune responses. Cytotoxic cluster of differentiation (CD)8<sup>+</sup> T cells target infected or aberrant host cells, whereas CD4<sup>+</sup> T helper cells facilitate B cell functions and coordinate effector cells and molecules. In addition to &#x3b1;&#x3b2; T cells, &#x3b3;&#x3b4; T cells likely also play important roles in homeostasis and infection, but their functions are less well characterized and appear to comprise both innate and adaptive effector functions (<xref ref-type="bibr" rid="B1">1</xref>&#x2013;<xref ref-type="bibr" rid="B3">3</xref>). Monoclonal antibodies specific for major chicken T cell antigens CD3, CD4, CD8, TCR &#x3b3;&#x3b4; (clone TCR-1), TCR &#x3b1;&#x3b2; V&#x3b2;1 (clone TCR-2), TCR &#x3b1;&#x3b2; V&#x3b2;2 (clone TCR-3) have been available for more than 30 years (<xref ref-type="bibr" rid="B4">4</xref>&#x2013;<xref ref-type="bibr" rid="B9">9</xref>). Yet, a detailed understanding of the intricate dynamics of T cell responses in chickens remains elusive. Unraveling the complexities of T cell-mediated immunity requires analysis of T cells on the clonal level.</p>
<p>Clonal T cell populations express identical TCRs on their surface, leading to shared antigen-specificity. The TCR structure comprises either an &#x3b1; and a &#x3b2; chain, or a &#x3b3; with a &#x3b4; chain, in heterodimeric form (<xref ref-type="bibr" rid="B8">8</xref>, <xref ref-type="bibr" rid="B10">10</xref>). During thymic development, na&#xef;ve T cells are generated, each possessing a distinct specificity in their TCR. This specificity arises from somatic DNA recombination of V(D)J genes, where the resulting variable domains are spliced to the Constant (C) domain exons at the 3&#x2019; end and to the first exon (L-PART1; nomenclature according to IMGT, the international Immunogenetics database) of the signal (leader) peptide at the 5&#x2019; end (<xref ref-type="bibr" rid="B11">11</xref>, <xref ref-type="bibr" rid="B12">12</xref>). Notably, the 5&#x2019; leader peptide in chicken V&#x3b1;1 genes is uniquely encoded within a single exon (<xref ref-type="bibr" rid="B13">13</xref>, <xref ref-type="bibr" rid="B14">14</xref>). Somatic DNA recombination occurs separately for each chain and is essential for generating a vast diversity of antigen receptors. The process is initiated by the recombination activating genes (RAG) recombinase that binds to conserved recombination signal sequences (RSSs) flanking each V, D and J gene segment. RSSs contain conserved heptamers and nonamers separated by a 12- ( &#xb1; 1) or a 23-mer ( &#xb1; 1) spacer, governing V(D)J recombination according to the 12-23 rule (<xref ref-type="bibr" rid="B11">11</xref>, <xref ref-type="bibr" rid="B12">12</xref>). The highly variable CDR3 at the V(D)J junction primarily interacts with the target peptide (<xref ref-type="bibr" rid="B10">10</xref>, <xref ref-type="bibr" rid="B15">15</xref>).</p>
<p>Previous work has identified V(D)J and C genes in the chicken genome that are arranged in highly structured clusters: The TCR &#x3b2; locus (TRB) spans a region of approximately 210 kilobases (kb) on chromosome 1 (<xref ref-type="bibr" rid="B16">16</xref>&#x2013;<xref ref-type="bibr" rid="B20">20</xref>), the TCR &#x3b3; locus (TRG) spans a region of approximately 82 kb on chromosome 2 (<xref ref-type="bibr" rid="B19">19</xref>, <xref ref-type="bibr" rid="B21">21</xref>&#x2013;<xref ref-type="bibr" rid="B23">23</xref>), and TCR &#x3b1; (TRA) and TCR &#x3b4; (TRD) genes are arranged in a hybrid locus of approximately 800 kb on chromosome 27, with the TCR &#x3b4; sequences nested between the V&#x3b1; and J&#x3b1; genes (<xref ref-type="bibr" rid="B13">13</xref>, <xref ref-type="bibr" rid="B14">14</xref>, <xref ref-type="bibr" rid="B19">19</xref>, <xref ref-type="bibr" rid="B24">24</xref>). In addition, a separate small TCR &#x3b4;-like locus was identified on chromosome 10 comprised of a single cassette with one copy of immunoglobulin heavy chain (IgH) V-like VH&#x3b4;, D&#x3b4;, J&#x3b4; and C&#x3b4; genes (<xref ref-type="bibr" rid="B25">25</xref>). V(D)J genes recognized within each locus were organized into subfamilies, and classified based on their predicted functionality as either functional (F) genes, open reading frame (ORF) genes or pseudogenes (P) (<xref ref-type="bibr" rid="B26">26</xref>). Unfortunately, however, annotation efforts as part of different studies focusing on the same locus reached varying conclusions regarding the number of VJ genes and V families. The observed incongruity likely stems from inconsistent gene annotation methodologies and variations in the genomes utilized. Furthermore, the challenge of comparability has been exacerbated by instances where the annotated sequences were not universally accessible in the public domain (<xref ref-type="bibr" rid="B14">14</xref>, <xref ref-type="bibr" rid="B19">19</xref>). 
Recent studies have provided robust annotations of the TCR &#x3b2; and TCR &#x3b3; loci (<xref ref-type="bibr" rid="B20">20</xref>, <xref ref-type="bibr" rid="B22">22</xref>, <xref ref-type="bibr" rid="B23">23</xref>). However, comprehensive details regarding the TCR &#x3b1;/&#x3b4; sequences are still unavailable.</p>
<p>In recent years, TCR repertoire sequencing has been widely used in mammals to dissect the intricacies of T cell-mediated immunity. TCR profiling enables the characterization of T cell diversity at baseline and facilitates quantification of clonal expansion and memory recall responses to microbial challenges (<xref ref-type="bibr" rid="B27">27</xref>, <xref ref-type="bibr" rid="B28">28</xref>). Current research endeavors have expanded this approach to chicken samples, offering a comprehensive analysis of private and public &#x3b2; and &#x3b3; T cell populations across various tissues and microbial conditions (<xref ref-type="bibr" rid="B22">22</xref>, <xref ref-type="bibr" rid="B23">23</xref>, <xref ref-type="bibr" rid="B29">29</xref>). However, current knowledge about chicken &#x3b1; and &#x3b4; chain sequences remains incomplete.</p>
<p>In this study, we set out to address gaps in the annotation of <italic>Gallus gallus</italic> TCR loci and expanded upon previous investigations involving chicken TCR repertoires. Molecular barcoding of cDNA molecules with unique molecular identifiers (UMIs) was integrated in our pipeline, thereby enhancing the quantitative precision essential for comprehensive TCR repertoire analysis (<xref ref-type="bibr" rid="B30">30</xref>, <xref ref-type="bibr" rid="B31">31</xref>). We provide a comprehensive annotation of all TCR loci within the Huxu chicken genome and a TCR profiling pipeline with baseline data on the physiologic TCR &#x3b1;, &#x3b2;, &#x3b3; and &#x3b4; repertoires in the spleen. We developed a tool, termed <italic>VJ-gene-finder</italic>, designed to streamline the annotation of chicken TCR genes in novel genome assemblies, and made it accessible to the public along with all sequence data. This will provide the basis for new investigations into T cell-mediated immunity in chickens.</p>
</sec>
<sec id="s2" sec-type="materials|methods">
<label>2</label>
<title>Materials and methods</title>
<sec id="s2_1">
<label>2.1</label>
<title>Animals</title>
<p>White Leghorn line M11 chickens (Friedrich-Loeffler-Institute, Federal Research Institute for Animal Health, Neustadt, Germany) were hatched and conventionally housed with ad libitum access to water and a commercial diet. Chickens were euthanized for tissue collection at 9&#x2013;13 weeks of age. Splenic tissue was collected and stored in RNAlater (Sigma-Aldrich, Burlington, MA, USA) immediately post-mortem, then incubated for 24 hours at 4&#xb0;C followed by long-term storage at &#x2212;20&#xb0;C.</p>
</sec>
<sec id="s2_2">
<label>2.2</label>
<title>RNA</title>
<p>Ribonucleic acid (RNA) was extracted using the SV Total RNA Isolation System (Promega, Madison, WI, USA) with an on-column incubation with deoxyribonuclease I (DNase I), quantified on a Nanodrop ND-1000 (Thermo Fisher Scientific, Waltham, MA, USA) and RNA quality was determined on a 2100 Bioanalyzer (RNA Integrity Number &gt; 9) (Agilent Technologies, Santa Clara, CA, USA).</p>
</sec>
<sec id="s2_3">
<label>2.3</label>
<title>Primer design for chicken TCR chains</title>
<p>For each TCR chain, an outer reverse 1 (<italic>R1</italic>) gene-specific primer for 5&#x2019; RACE and two nested primers (<italic>R2</italic> and <italic>R3</italic>) were designed to bind to C exons of &#x3b1; (GenBank EF554736), &#x3b2; (GenBank EF554782), &#x3b3; (GenBank NM_001318455) or &#x3b4; (GenBank AF175433) chains using Geneious Prime 2022.0.1 (<ext-link ext-link-type="uri" xlink:href="https://www.geneious.com/">https://www.geneious.com/</ext-link>). The <italic>R3</italic> for each chain was designed to bind close to the 5&#x2019; end of the C gene. Target-specificity was confirmed by NCBI Primer-BLAST against the <italic>Gallus gallus</italic> RefSeq messenger RNA (mRNA) database (<xref ref-type="bibr" rid="B32">32</xref>). Primer sequences are listed in <xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>.</p>
<table-wrap id="T1" position="float">
<label>Table&#xa0;1</label>
<caption>
<p>Primer sequences for TCR-specific 5&#x2019; RACE and PCR amplification.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="left">Step</th>
<th valign="middle" align="left">Name</th>
<th valign="middle" align="left">Sequence</th>
<th valign="middle" align="left">F/R</th>
<th valign="middle" align="left">Chain</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="left">cDNA</td>
<td valign="middle" align="left">
<italic>SmartNNNNa*</italic>
</td>
<td valign="middle" align="left">
<italic>AAGCAGUGGTAUCAACGCAGAGUNNNNUNNNNUNNNNUCTTrGrGrGrG</italic>
</td>
<td valign="middle" align="left">F</td>
<td valign="middle" align="left">&#x3b1;&#x3b2;&#x3b3;&#x3b4;</td>
</tr>
<tr>
<td valign="middle" align="left">cDNA</td>
<td valign="middle" align="left">
<italic>chTRAC_R1</italic>
</td>
<td valign="middle" align="left">
<italic>CTGTCTTACTATCGACTGAG</italic>
</td>
<td valign="middle" align="left">R</td>
<td valign="middle" align="left">&#x3b1;</td>
</tr>
<tr>
<td valign="middle" align="left">cDNA</td>
<td valign="middle" align="left">
<italic>chTRBC_R1</italic>
</td>
<td valign="middle" align="left">
<italic>ACCTTCCAGACTAAATTGAG</italic>
</td>
<td valign="middle" align="left">R</td>
<td valign="middle" align="left">&#x3b2;</td>
</tr>
<tr>
<td valign="middle" align="left">cDNA</td>
<td valign="middle" align="left">
<italic>chTRGC_R1</italic>
</td>
<td valign="middle" align="left">
<italic>CATCGGTCCATTTCACCCGA</italic>
</td>
<td valign="middle" align="left">R</td>
<td valign="middle" align="left">&#x3b3;</td>
</tr>
<tr>
<td valign="middle" align="left">cDNA</td>
<td valign="middle" align="left">
<italic>chTRDC_R1</italic>
</td>
<td valign="middle" align="left">
<italic>TCATTAGAGGACATCTCCAAA</italic>
</td>
<td valign="middle" align="left">R</td>
<td valign="middle" align="left">&#x3b4;</td>
</tr>
<tr>
<td valign="middle" align="left">PCR1</td>
<td valign="middle" align="left">
<italic>Smart20*</italic>
</td>
<td valign="middle" align="left">
<italic>CACTCTATCCGACAAGCAGTGGTATCAACGCAG</italic>
</td>
<td valign="middle" align="left">F</td>
<td valign="middle" align="left">&#x3b1;&#x3b2;&#x3b3;&#x3b4;</td>
</tr>
<tr>
<td valign="middle" align="left">PCR1</td>
<td valign="middle" align="left">
<italic>chTRAC_R2</italic>
</td>
<td valign="middle" align="left">
<italic>GGTCAGCCTGTAGACTGAAGG</italic>
</td>
<td valign="middle" align="left">R</td>
<td valign="middle" align="left">&#x3b1;</td>
</tr>
<tr>
<td valign="middle" align="left">PCR1</td>
<td valign="middle" align="left">
<italic>chTRBC_R2</italic>
</td>
<td valign="middle" align="left">
<italic>TGCTTTGATGGTGAAAAGATGACC</italic>
</td>
<td valign="middle" align="left">R</td>
<td valign="middle" align="left">&#x3b2;</td>
</tr>
<tr>
<td valign="middle" align="left">PCR1</td>
<td valign="middle" align="left">
<italic>chTRGC_R2</italic>
</td>
<td valign="middle" align="left">
<italic>TCATGTTCCTCCTGCATGATTTC</italic>
</td>
<td valign="middle" align="left">R</td>
<td valign="middle" align="left">&#x3b3;</td>
</tr>
<tr>
<td valign="middle" align="left">PCR1</td>
<td valign="middle" align="left">
<italic>chTRDC_R2</italic>
</td>
<td valign="middle" align="left">
<italic>TGATTTCATCACAATGACCTCTGG</italic>
</td>
<td valign="middle" align="left">R</td>
<td valign="middle" align="left">&#x3b4;</td>
</tr>
<tr>
<td valign="middle" align="left">PCR2</td>
<td valign="middle" align="left">
<italic>Step_1*</italic>
</td>
<td valign="middle" align="left">
<italic>(acactctttccctacacgacgctcttccgatct)XXXXXCACTCTATCCGACAAGCAGT</italic>
</td>
<td valign="middle" align="left">F</td>
<td valign="middle" align="left">&#x3b1;&#x3b2;&#x3b3;&#x3b4;</td>
</tr>
<tr>
<td valign="middle" align="left">PCR2</td>
<td valign="middle" align="left">
<italic>chTRAC_R3</italic>
</td>
<td valign="middle" align="left">
<italic>(gactggagttcagacgtgtgctcttccgatct)XXXXXGTAGACTGAAGGAGATGGAGTAAT</italic>
</td>
<td valign="middle" align="left">R</td>
<td valign="middle" align="left">&#x3b1;</td>
</tr>
<tr>
<td valign="middle" align="left">PCR2</td>
<td valign="middle" align="left">
<italic>chTRBC_R3</italic>
</td>
<td valign="middle" align="left">
<italic>(gactggagttcagacgtgtgctcttccgatct)XXXXXGGTTCTATGATTTCACTGTTCTTCC</italic>
</td>
<td valign="middle" align="left">R</td>
<td valign="middle" align="left">&#x3b2;</td>
</tr>
<tr>
<td valign="middle" align="left">PCR2</td>
<td valign="middle" align="left">
<italic>chTRGC_R3</italic>
</td>
<td valign="middle" align="left">
<italic>(gactggagttcagacgtgtgctcttccgatct)XXXXXCTGGTGCTGAACTTCCTTTGTC</italic>
</td>
<td valign="middle" align="left">R</td>
<td valign="middle" align="left">&#x3b3;</td>
</tr>
<tr>
<td valign="middle" align="left">PCR2</td>
<td valign="middle" align="left">
<italic>chTRDC_R3</italic>
</td>
<td valign="middle" align="left">
<italic>(gactggagttcagacgtgtgctcttccgatct)XXXXXGAATAGAATCTCTCTGCTCCC</italic>
</td>
<td valign="middle" align="left">R</td>
<td valign="middle" align="left">&#x3b4;</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>*Adapted from (<xref ref-type="bibr" rid="B31">31</xref>); N = any nucleotide (<italic>A, T, G or C</italic>); <italic>rG</italic> = riboguanosine; <italic>U</italic> = deoxyuracil; () = overhang for library preparation; <italic>XXXXX</italic> = optional sample barcode; F = forward primer; R = reverse primer.</p>
</fn>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="s2_4">
<label>2.4</label>
<title>
<italic>VJ-gene-finder</italic>
</title>
<p>A new search algorithm, &#x201c;<italic>VJ-gene-finder</italic>&#x201d;, was developed to identify and extract functional V and J genes from the chicken genome, based on characteristic biological patterns that define immunoglobulin V and J genes in many species (<xref ref-type="bibr" rid="B11">11</xref>, <xref ref-type="bibr" rid="B33">33</xref>). The features used include conserved amino acid residues at specific positions (for V segments according to IMGT nomenclature: &#x201c;1<sup>st</sup>-CYS&#x201d;, &#x201c;CONSERVED-TRP&#x201d; and &#x201c;YYC/YFC/YLC/YHC/YIC/TFC&#x201d; motif that includes the &#x201c;2<sup>nd</sup>-CYS&#x201d;; for J segments: &#x201c;FG&#x201d; motif), conserved nucleic acid motifs in genes and at specific positions (for V genes with a single-exon leader sequence: <italic>ATG</italic> start codon; for V genes with a spliced leader sequence: splice acceptor sequence <italic>AG</italic>; for J segments: <italic>TTYGGNNNNGG</italic> and <italic>TNNBNRT</italic>, and splice donor sequence <italic>GTRDGD</italic>) and conserved recombination signal sequences (for both V and J segments: begin with <italic>CAC</italic> nucleic acid motif) in combination with length constraints and the requirement for an open reading frame with or without splicing. A summary of the algorithm for V genes (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figures&#xa0;1A, B</bold>
</xref>) and J genes (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figures&#xa0;2A, B</bold>
</xref>) is included in the <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Material</bold>
</xref>. <italic>VJ-gene-finder</italic> was written in Python and it was made publicly available as free and open-source software (<ext-link ext-link-type="uri" xlink:href="https://github.com/simonfrueh/VJ-gene-finder">https://github.com/simonfrueh/VJ-gene-finder</ext-link>). The algorithm is similar to the method used by Oliveri et&#xa0;al. (<xref ref-type="bibr" rid="B33">33</xref>), but was modified to enable identification of chicken TCR V genes that are encoded by a single exon (together with the leader sequences) (<xref ref-type="bibr" rid="B13">13</xref>) and an additional function was added to search and extract J gene candidates. Additionally, <italic>VJ-gene-finder</italic> tentatively assigns candidate V genes to chicken V gene families based on amino acid motifs near the 5&#x2019; end (TRAV1: &#x201c;QVQQ&#x201d;, TRAV2: &#x201c;VSQQ&#x201d;, TRAV3: &#x201c;LQYP&#x201d;, TRBV1: &#x201c;LQQT&#x201d;, TRBV2: &#x201c;EINQ&#x201d;, TRBV3: &#x201c;ITQW&#x201d;, TRGV1: &#x201c;QVLLQQ&#x201d;, TRGV2: &#x201c;PIQS&#x201d;, TRGV3: &#x201c;QAVPMQ&#x201d; or &#x201c;QAAPVQ&#x201d;, TRGV4: &#x201c;LWQSP&#x201d;, TRDV1: &#x201c;ETSGGGV&#x201d;, TRDV2: &#x201c;LEASGGG&#x201d;, TRDV3: &#x201c;VEFGGDV&#x201d;, TRDV4: &#x201c;RIVEAG&#x201d;, TRDV5: &#x201c;EIHAKKSA&#x201d;, TRDVH1: &#x201c;QIEMVTT&#x201d;).</p>
</sec>
<sec id="s2_5">
<label>2.5</label>
<title>Annotation of TCR loci</title>
<p>
<italic>VJ-gene-finder</italic> (v0.1) was used to identify putative V and J gene sequences that match the search criteria in chromosomes 1, 2, 27 and 10 of the Huxu chicken genome assembly GGswu (GenBank assembly GCA_024206055.2) (<xref ref-type="bibr" rid="B34">34</xref>). The search criteria were not specific to VJ segments, thus the algorithm also extracted non-VJ segments outside of the TCR loci. <italic>Clustal</italic> multiple sequence alignment of candidate sequences in Jalview revealed clusters of highly similar (functional) V and J genes (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figures&#xa0;1C, 2C</bold>
</xref>) (<xref ref-type="bibr" rid="B35">35</xref>&#x2013;<xref ref-type="bibr" rid="B37">37</xref>). The chromosomal location of these genes defined the TCR locus for each TCR chain. <italic>VJ-gene-finder</italic> hits outside of the TCR locus were more dissimilar to each other and were discarded (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figures&#xa0;1C, 2C</bold>
</xref>). Each putative V gene was manually annotated in Artemis Release 18.2.0 (<xref ref-type="bibr" rid="B38">38</xref>) and examined for the presence of predicted functional features, including a start codon, an RSS, leader sequences and splice sites using <italic>Recombination Signal Sequences Site</italic>, <italic>SignalP 6.0</italic> and <italic>Spliceator</italic> (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure&#xa0;1D</bold>
</xref>) (<xref ref-type="bibr" rid="B39">39</xref>&#x2013;<xref ref-type="bibr" rid="B41">41</xref>). J genes were manually annotated for the presence of a functional RSS and splice site using the same tools (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure&#xa0;2D</bold>
</xref>). By design, <italic>VJ-gene-finder</italic> only identified functional (F) and open reading frame (ORF) V and J genes (IMGT functionality nomenclature) (<xref ref-type="bibr" rid="B26">26</xref>). To identify V and J pseudogenes (P), potentially unidentified VJ F and ORF genes, and to detect D genes, TCR amplicon sequences were aligned to the Huxu chromosomes. These amplicons were generated in our laboratory as part of a different study from the same chicken line, following the same amplification strategy, with RNA from fluorescence-activated cell sorting (FACS)-isolated peripheral blood T cells. To enable partial and local alignment of spliced and rearranged TCR sequences to the un-rearranged genome, we employed the <italic>bowtie2</italic> (v2.3.5.1) aligner with options <italic>--no-unal --local</italic> (<xref ref-type="bibr" rid="B42">42</xref>). Raw reads were directly aligned to the reference sequence, converted to BAM files, sorted and indexed using <italic>samtools</italic> (v1.15.1) and the alignment was visualized in <italic>Artemis</italic> (<xref ref-type="bibr" rid="B43">43</xref>). Regions with aligned partial TCR sequences were examined for the presence or absence of RSSs, splice sites, conserved amino acid and conserved nucleotide sequences as described above.</p>
<p>V genes were classified as functional when all conserved amino acids were identified, when a predicted 23-mer spacer (23)RSS was found at the 3&#x2019; end and the (spliced) leader sequence at the 5&#x2019; end encoded a predicted signal peptide, and frameshift mutations or stop codons were absent. The length of the V gene was defined ranging from the cleavage site of the signal peptide as predicted by <italic>SignalP 6.0</italic> to the beginning of the RSS (<italic>CAC</italic> motif) (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figures&#xa0;1A, B, D</bold>
</xref>). J genes were classified as functional only when stop codons were absent and when the conserved &#x201c;FG&#x201d; motif, a predicted 12-mer spacer (12)RSS at the 5&#x2019; end and a splice donor at the 3&#x2019; end were identified (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figures&#xa0;2A, B, D</bold>
</xref>). The RSS and splice site also defined the beginning and end of the J gene. D genes were identified using <italic>bowtie2</italic> alignments and were defined as a sequence between a 12RSS and a 23RSS without any stop codons. Sequences without stop codons or frameshift mutations that were altered in one of the above-mentioned features were classified as ORFs. Sequences with aligned reads that contained stop codons, frameshift mutations or an RSS without a <italic>CAC</italic> motif were classified as pseudogenes. Pseudogenes and the length of pseudogenes could not always be identified unambiguously because pseudogenes, by definition, lack certain characteristics that define immunoglobulin genes. All identified V(D)J genes and alterations (if applicable) are summarized in <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table&#xa0;1</bold>
</xref>.</p>
</sec>
<sec id="s2_6">
<label>2.6</label>
<title>V family assignment, V and J gene numbering, CDR and FR annotation</title>
<p>TCR V genes with &#x2265;75% nucleotide sequence identity were grouped into V families following the nomenclature outlined by the international ImMunoGeneTics information system (IMGT) (<xref ref-type="bibr" rid="B11">11</xref>). For V family assignment, DNA sequences of V genes were analyzed using EMBL-EBI online analysis tools (<xref ref-type="bibr" rid="B44">44</xref>). For each chain, V genes were aligned using Clustal Omega, clade consensus sequences were determined with <italic>EMBOSS Cons</italic> and percent identity to the group consensus was calculated with <italic>MView</italic> (<xref ref-type="bibr" rid="B45">45</xref>). The identity threshold for V gene families was 75%, except for TRGV2-27 that was assigned to the TRGV2 family with an identity of 73.8% compared to the group consensus. Chicken V families were assigned numbers based on established nomenclature from prior studies, where applicable (<xref ref-type="bibr" rid="B20">20</xref>, <xref ref-type="bibr" rid="B23">23</xref>). Additionally, new V families, including those within the &#x3b4; locus, as well as all V genes within each family, were numbered in ascending order from 5&#x2019; to 3&#x2019; (towards the C gene). Consistent with previous conventions in chickens, J genes were similarly numbered sequentially in ascending order from 5&#x2019; to 3&#x2019; direction, progressing towards the C gene (<xref ref-type="bibr" rid="B20">20</xref>, <xref ref-type="bibr" rid="B22">22</xref>, <xref ref-type="bibr" rid="B23">23</xref>). CDR and framework (FR) regions were defined by alignment with <italic>IMGT/DomainGapAlign</italic> against <italic>Homo sapiens</italic> V Domain reference sequences (<xref ref-type="bibr" rid="B46">46</xref>). TRAJ genes were annotated based on the conserved &#x201c;F/WG.G&#x201d; motif. 
The reading frame of unconventional TRAJ genes that lacked the motif was examined in several individual sequencing reads and anchor points &#x201c;CDR3 end&#x201d; and &#x201c;FR4 begin&#x201d; were defined accordingly.</p>
</sec>
<sec id="s2_7">
<label>2.7</label>
<title>Comparison to previous TCR gene annotations</title>
<p>Only full-length V genes &gt; 222 bp among the genes annotated in this study were considered for the sequence comparison. For each locus, reference sequences from previous studies were queried against the reference sequences from this study by pairwise alignment with <italic>Biopython</italic> (v1.83) using <italic>pairwise2.align.globalxx()</italic> (<xref ref-type="bibr" rid="B47">47</xref>). Alignments were compared using the following formulas: 
<inline-formula>
<mml:math display="inline" id="im1">
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>c</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi>t</mml:mi>
<mml:mo>&#xa0;</mml:mo>
<mml:mi>i</mml:mi>
<mml:mi>d</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>y</mml:mi>
<mml:mo>&#xa0;</mml:mo>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>d</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>c</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>l</mml:mi>
<mml:mo>&#xa0;</mml:mo>
<mml:mi>p</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>s</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>l</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi>g</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>h</mml:mi>
<mml:mo>&#xa0;</mml:mo>
<mml:mi>o</mml:mi>
<mml:mi>f</mml:mi>
<mml:mo>&#xa0;</mml:mo>
<mml:mi>s</mml:mi>
<mml:mi>h</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>r</mml:mi>
<mml:mo>&#xa0;</mml:mo>
<mml:mi>s</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>q</mml:mi>
<mml:mi>u</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi>c</mml:mi>
<mml:mi>e</mml:mi>
</mml:mrow>
</mml:mfrac>
<mml:mo>&#xa0;</mml:mo>
<mml:mo>&#xd7;</mml:mo>
<mml:mn>100</mml:mn>
<mml:mo>&#xa0;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>and the <inline-formula>
<mml:math display="inline" id="im2">
<mml:mrow>
<mml:mi>n</mml:mi>
<mml:mi>u</mml:mi>
<mml:mi>m</mml:mi>
<mml:mi>b</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>r</mml:mi>
<mml:mo>&#xa0;</mml:mo>
<mml:mtext mathvariant="italic">of </mml:mtext>
<mml:mi>m</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>s</mml:mi>
<mml:mi>m</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>c</mml:mi>
<mml:mi>h</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>s</mml:mi>
<mml:mo>&#xa0;</mml:mo>
<mml:mo>=</mml:mo>
<mml:mi>l</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi>g</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>h</mml:mi>
<mml:mo>&#xa0;</mml:mo>
<mml:mi>o</mml:mi>
<mml:mi>f</mml:mi>
<mml:mo>&#xa0;</mml:mo>
<mml:mi>s</mml:mi>
<mml:mi>h</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>r</mml:mi>
<mml:mo>&#xa0;</mml:mo>
<mml:mi>s</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>q</mml:mi>
<mml:mi>u</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi>c</mml:mi>
<mml:mi>e</mml:mi>
<mml:mo>&#xa0;</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:mi>i</mml:mi>
<mml:mi>d</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>c</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>l</mml:mi>
<mml:mo>&#xa0;</mml:mo>
<mml:mi>p</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>s</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi>s</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>. The best match with the highest percent identity, or multiple matches in case of equal percent identity, were reported for each query sequence.</p>
</sec>
<sec id="s2_8">
<label>2.8</label>
<title>Evolutionary analysis</title>
<p>Evolutionary analyses were conducted in <italic>MEGA11</italic> as previously described (<xref ref-type="bibr" rid="B48">48</xref>, <xref ref-type="bibr" rid="B49">49</xref>). In brief, all VJ (functional and ORF) DNA sequences annotated as part of these studies were aligned using <italic>MUSCLE</italic>. The best substitution model was identified by <italic>MEGA11</italic> (K2+G+I) and used to construct a Maximum Likelihood Tree (with partial deletion option). The reliability of the tree was estimated with 500 bootstrap replicates and the tree was visualized using <italic>iTOL v6</italic> (<xref ref-type="bibr" rid="B50">50</xref>). Dotplots were created with <italic>Unipro UGENE</italic> (v48.1) with a minimum repeat length of 100 bp and a repeat identity threshold of 100% (<xref ref-type="bibr" rid="B51">51</xref>). Locus representation plots were created with <italic>DNA Features Viewer</italic> (v3.1.3) (<xref ref-type="bibr" rid="B52">52</xref>).</p>
</sec>
<sec id="s2_9">
<label>2.9</label>
<title>5&#x2019; RACE</title>
<p>A previously described approach for TCR-specific 5&#x2019; RACE was modified for chicken samples (<xref ref-type="bibr" rid="B31">31</xref>, <xref ref-type="bibr" rid="B53">53</xref>). A UMI was included in the template switching oligo for <italic>in silico</italic> removal of polymerase chain reaction (PCR) duplicates and improved error correction (<xref ref-type="bibr" rid="B30">30</xref>). In addition, 5-nucleotide sample barcodes were added at the 5&#x2019; end to the primers of the second PCR (chain-specific) for demultiplexing of pooled samples (<xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>). Depending on the sequencing provider and the library preparation method, specific adapter sequences can also be added to the primers of the second PCR (<xref ref-type="bibr" rid="B31">31</xref>, <xref ref-type="bibr" rid="B54">54</xref>). In this study, the PCR 2 oligonucleotides contained the following adapter sequences: <italic>ACACTCTTTCCCTACACGACGCTCTTCCGATCT</italic> (forward primer) and <italic>GACTGGAGTTCAGACGTGTGCTCTTCCGATCT</italic> (reverse primer). For first strand cDNA synthesis with template switching, 500 ng of purified total RNA in 3 &#x3bc;l nuclease-free water were combined with 1.5 &#x3bc;l antisense primer mix containing equal amounts of 10 &#x3bc;M reverse primers (<italic>chTRAC_R1</italic> and <italic>chTRBC_R1</italic> for amplification of &#x3b1;&#x3b2; TCRs or <italic>chTRGC_R1</italic> and <italic>chTRDC_R1</italic> for amplification of &#x3b3;&#x3b4; TCRs). The template-antisense primer mixture was incubated at 72&#xb0;C for 3 minutes and at 42&#xb0;C for 2 minutes. Then 5.5 &#x3bc;l of reverse transcription master mix containing 2 &#x3bc;l of 5x First-Strand Buffer, 0.25 &#x3bc;l of 100 mM DL-Dithiothreitol, 1 &#x3bc;l of deoxynucleotide triphosphates (dNTPs) (10 mM each) (both Promega, Madison, WI, USA), 1 &#x3bc;l of 10 &#x3bc;M <italic>SmartNNNNa</italic> primer, 0.25 &#x3bc;l of ribonuclease (RNase) Inhibitor (40 U/&#x3bc;l) and 1 &#x3bc;l SMARTScribe Reverse Transcriptase (both Takara Bio, Kusatsu, Shiga, Japan) was added to each sample and the first strand synthesized by incubation at 42&#xb0;C for 90 minutes and at 70&#xb0;C for 10 minutes. The cDNA was cooled on ice, then 5 &#x3bc;l USER Enzyme (1 U/&#x3bc;l) (New England Biolabs, Ipswich, MA, USA) was added and the mixture was incubated at 37&#xb0;C for 60 minutes. cDNA was stored at -20&#xb0;C.</p>
</sec>
<sec id="s2_10">
<label>2.10</label>
<title>Polymerase chain reaction and amplicon next generation sequencing</title>
<p>For the first PCR (PCR 1), 5 &#x3bc;l of template cDNA was combined with 35 &#x3bc;l nuclease-free water, 5 &#x3bc;l 10x Advantage 2 PCR Buffer, 1 &#x3bc;l dNTPs (10 mM each) (Promega, Madison, WI, USA), 1 &#x3bc;l Smart20 primer (10 &#x3bc;M), 2 &#x3bc;l antisense primer mix containing equal amounts of 10 &#x3bc;M reverse primers (<italic>chTRAC_R2</italic> and <italic>chTRBC_R2</italic> for amplification of &#x3b1;&#x3b2; TCRs or <italic>chTRGC_R2</italic> and <italic>chTRDC_R2</italic> for amplification of &#x3b3;&#x3b4; TCRs) and 1 &#x3bc;l 50x Advantage 2 Polymerase Mix (Takara Bio, Kusatsu, Shiga, Japan). PCR 1 was carried out by incubation at 95&#xb0;C for 1 minute, followed by 19 repeated cycles of incubation at 95&#xb0;C for 20 seconds (s), 65&#xb0;C for 20 s and 68&#xb0;C for 50 s, followed by a final extension at 68&#xb0;C for 3 minutes. PCR 1 amplicons were purified with AMPure XP beads (Beckman Coulter, Brea, CA, USA) using a ratio of PCR 1 Reaction Volume (&#x3bc;l): AMPure XP Volume (&#x3bc;l) of 1: 0.65, with two washes with 80% Ethanol on a SMARTer-Seq Magnetic Separator (Takara Bio, Kusatsu, Shiga, Japan) and elution in 27 &#x3bc;l nuclease-free water. The second PCR (PCR 2) was carried out separately for each TCR chain. The reaction mix contained 19.5 &#x3bc;l nuclease-free water, 2.5 &#x3bc;l 10x Advantage 2 PCR Buffer, 0.5 &#x3bc;l dNTPs (10 mM each), 0.5 &#x3bc;l <italic>Step_1</italic> primer (10 &#x3bc;M), 0.5 &#x3bc;l <italic>R3</italic> chain-specific reverse primer (10 &#x3bc;M), 0.5 &#x3bc;l 50x Advantage 2 Polymerase Mix with 1 &#x3bc;l purified PCR 1 product as template. For &#x3b4; chains, 2 &#x3bc;l purified PCR 1 product was used as template. The PCR 2 cycling conditions were the same as for PCR 1, except with a different number of repeated cycles (13 cycles for &#x3b1;, 11 cycles for &#x3b2;, 15 cycles for &#x3b3; and 15 cycles for &#x3b4;). 
PCR 2 amplicons were purified by gel electrophoresis on a 1.25% Agarose gel with Novel Juice DNA stain (Sigma-Aldrich, Burlington, MA, USA), excision of bands of the desired size [~600 - 650 base pairs (bp)] on a blue light table and gel extraction with the Monarch DNA Gel Extraction Kit (New England Biolabs, Ipswich, MA, USA). Of note, in some cases (particularly with &#x3b1; and &#x3b3; chain amplicons), secondary bands ~100 - 200 bp larger than the desired size were observed, which were likely cDNA molecules with long UTRs and/or incomplete or false splicing. Those extra bands were excluded during gel extraction. Purified PCR 2 amplicons were quantified with a Quantus Fluorometer and the QuantiFluor dsDNA System (both Promega, Madison, WI, USA). Library preparation (2<sup>nd</sup> PCR Amplicon option) and paired-end sequencing at 2x300 bp on an Illumina MiSeq Instrument (Illumina, San Diego, USA) was performed by Eurofins Genomics Germany GmbH (Ebersberg, Germany).</p>
</sec>
<sec id="s2_11">
<label>2.11</label>
<title>Quality control and TCR sequence analysis</title>
<p>The quality of raw reads was determined using <italic>fastqc</italic> (v0.11.9) and <italic>MultiQC</italic> (v1.15) (<xref ref-type="bibr" rid="B55">55</xref>, <xref ref-type="bibr" rid="B56">56</xref>) and reads were analyzed with <italic>MiXCR</italic> (v4.2.0) (<xref ref-type="bibr" rid="B57">57</xref>). A custom germline V(D)J library containing chicken &#x3b1;, &#x3b2;, &#x3b3; and &#x3b4; chain sequences was created with <italic>repseqio</italic> (v1.3.5) [now part of <italic>MiXCR</italic> (v4)]. In brief, all functional and ORF segments (annotated in this study) were exported as Fasta files and converted into a JSON structured library with <italic>repseqio</italic> using the <italic>fromPaddedFasta</italic> option. Anchor points were specified manually for V genes (<italic>-FR1Begin, -CDR1Begin, -FR2Begin, -CDR2Begin, -FR3Begin, -CDR3Begin, -VEnd</italic>), D genes (<italic>-DBegin, -DEnd</italic>) and J genes (<italic>-JBegin, -FR4Begin, -FR4End</italic>) and annotated sequences were compiled into one chicken VDJ library with <italic>repseqio merge</italic>. This library was used in <italic>MiXCR</italic> to align and annotate TCR sequences. Alignment (<italic>mixcr align</italic>) was used with options <italic>-p generic-tcr-amplicon-umi</italic>, <italic>-OallowChimeras=true, &#x2013;tag-parse-unstranded</italic>, <italic>&#x2013;rna</italic>, <italic>&#x2013;rigid-left-alignment-boundary</italic>, <italic>&#x2013;floating-right-alignment-boundary C</italic>, <italic>&#x2013;tag pattern &#x2018;^*(UMI : TNNNNTNNNNTNNNNT)ctt(R1:*)\^(R2:*)&#x2019;</italic>. Tags were refined with <italic>mixcr refineTagsAndSort</italic>, CDR3 clonotypes were assembled with <italic>mixcr assemble</italic> and clonotype tables exported with <italic>mixcr exportClones</italic>. 
Clonotype tables were randomly downsampled within each chain to the weighted total number of clonotypes of the smallest sample and analyzed and visualized using <italic>Jupyter Notebook</italic> (v7.0.6) with <italic>python</italic> (v3.11.7), <italic>matplotlib</italic> (v3.8.2), <italic>numpy</italic> (v1.26.2), <italic>pandas</italic> (v2.1.3), <italic>scipy</italic> (v1.11.4) and <italic>seaborn</italic> (v0.13.0) (<xref ref-type="bibr" rid="B58">58</xref>&#x2013;<xref ref-type="bibr" rid="B62">62</xref>). Additional analyses were conducted using <italic>R</italic> software (v4.3.2) with <italic>reshape2</italic> (v1.4.4) and <italic>tidyverse</italic> packages (v2.0.0) (<xref ref-type="bibr" rid="B63">63</xref>, <xref ref-type="bibr" rid="B64">64</xref>).</p>
</sec>
<sec id="s2_12">
<label>2.12</label>
<title>Statistical analysis</title>
<p>Statistical analyses were conducted using <italic>R</italic> software (v4.3.2). A negative binomial generalized linear model (GLM) was fitted to account for overdispersion, with counts of T cell receptor sequences or counts of amino acids in T cell receptor sequences as the response variable and V gene type, V family type, J gene type, or amino acid type as predictors. This analysis was performed using the <italic>glm.nb()</italic> function from the <italic>MASS</italic> package (v7.3-60) (<xref ref-type="bibr" rid="B65">65</xref>). The overall significance of predictors in the model was assessed through analysis of deviance tests using the <italic>Anova()</italic> function from the <italic>car</italic> package (v3.1-2) (<xref ref-type="bibr" rid="B66">66</xref>). For <italic>post-hoc</italic> pairwise comparisons among levels of the predictors, the <italic>emmeans</italic> package (v1.10.0) was employed, applying Tukey adjustment for multiple comparisons (<xref ref-type="bibr" rid="B67">67</xref>).</p>
</sec>
</sec>
<sec id="s3" sec-type="results">
<label>3</label>
<title>Results</title>
<sec id="s3_1">
<label>3.1</label>
<title>The chicken TCR loci</title>
<p>Our goal was to establish a targeted TCR repertoire analysis for all four chicken TCR chains using Next Generation Sequencing (NGS). Bioinformatic analysis of expressed TCRs relies upon a comprehensive annotation of the germline V(D)J repertoire, enabling identification of functional regions (FRs, CDRs) and germline gene identity. To generate an updated and systematic annotation of the chicken TCR loci, we semi-automatically extracted VJ genes from TCR loci within the recent Huxu chicken genome assembly (<xref ref-type="bibr" rid="B34">34</xref>) using <italic>VJ-gene-finder</italic>, a program that was generated as part of this study. The search algorithm of <italic>VJ-gene-finder</italic> is based on the method by Olivieri et&#xa0;al., with chicken-specific adjustments to the motif criteria and new functionality for extraction of putative J genes and V genes with a single-exon leader peptide (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figures&#xa0;1A, B, 2A, B</bold>
</xref>) (<xref ref-type="bibr" rid="B33">33</xref>). <italic>VJ-gene-finder</italic> hits were manually curated and functional RSSs, splice sites and signal peptides were verified (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figures&#xa0;1C, D, 2C, D</bold>
</xref>). Pseudogenes and additional genes, not identified by <italic>VJ-gene-finder</italic>&#x2019;s search parameters, were manually annotated. This annotation process was facilitated by the local (partial) alignment of raw reads from TCR amplicons, generated using the amplification strategy described in this study, directly to the genome. In summary, a total of 282 TCR gene segments was identified (<xref ref-type="fig" rid="f1">
<bold>Figures&#xa0;1</bold>
</xref>&#x2013;<xref ref-type="fig" rid="f3">
<bold>3</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table&#xa0;1</bold>
</xref>). <italic>VJ-gene-finder</italic> recognized 164 of 169 total functional (F) and open reading frame (ORF) V genes and 67 of 74 total J genes. All V(D)J genes, except TRBV2-4, were located on the reverse strand and each locus comprised only a single C gene. TCR V genes exhibiting &#x2265;75% sequence identity at the nucleotide level were grouped into V families, facilitating classification and analysis.</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>The chicken TCR &#x3b1;/&#x3b4; locus on chromosome 27. To-scale representation of the TCR &#x3b1;/&#x3b4; hybrid locus within the reverse strand on chromosome 27 (Huxu chicken genome) with V(D)JC genes labeled, and summary tables with total gene counts. The DNA segment presented was specifically chosen to cover the entire TCR locus. Gene names are composed of chain (TRA = TCR &#x3b1;, TRD = TCR &#x3b4;), type (V, variable; D, diversity; J, joining), family, and an individual number (in ascending order) separated by a dash. &#x201c;p&#x201d; prefix indicates pseudogenes and &#x201c;orf&#x201d; prefix indicates open reading frames. The region containing the TCR &#x3b4; locus was indicated by a blue bar. Only the first exon of the constant (C) gene was depicted.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fimmu-15-1359169-g001.tif"/>
</fig>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>The chicken TCR &#x3b2; locus on chromosome 1. To-scale representation of the TCR &#x3b2; locus within the reverse strand on chromosome 1 (Huxu chicken genome) with VDJC genes labeled, and a summary table with total gene counts. The DNA segment presented was specifically chosen to cover the entire TCR locus. Gene names are composed of chain (TRB = TCR &#x3b2;), type (V, variable; D, diversity; J, joining), family, and an individual number (in ascending order) separated by a dash. &#x201c;p&#x201d; prefix indicates pseudogenes and &#x201c;orf&#x201d; prefix indicates open reading frames.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fimmu-15-1359169-g002.tif"/>
</fig>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>The chicken TCR &#x3b3; locus on chromosome 2. To-scale representation of the TCR &#x3b3; locus within the reverse strand on chromosome 2 (Huxu chicken genome) with VJC genes labeled, and a summary table with total gene counts. The DNA segment presented was specifically chosen to cover the entire TCR locus. Gene names are composed of chain (TRG = TCR &#x3b3;), type (V, variable; D, diversity; J, joining), family, and an individual number (in ascending order) separated by a dash. &#x201c;p&#x201d; prefix indicates pseudogenes and &#x201c;orf&#x201d; prefix indicates open reading frames.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fimmu-15-1359169-g003.tif"/>
</fig>
<p>The TCR &#x3b1;/&#x3b4; locus spanned ~970 kb on chromosome 27, with TCR &#x3b4; occupying approximately 310 kb (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1</bold>
</xref>). 72 V&#x3b1; segments were clustered in three families, TRAV1 (T cell receptor alpha Variable family 1) with 48 genes (of which 12 were pseudogenes), TRAV2 with 23 genes and a single TRAV3 gene adjacent to the TCR &#x3b4; locus (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table&#xa0;1</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Files 1, 2</bold>
</xref>). All TRAV1 family members except TRAV1-21 (TRAV1 family member number 21), TRAV1-47 and TRAV1-49 encoded a leader peptide in a single exon with the V gene. The majority of TRAV1 members were classified as ORF genes due to a low mean recombination information content (RIC) score of the RSSs (a score that is used to predict physiological RSSs; the score was calculated by <italic>RSSsite</italic> and is defined as the natural logarithm of marginal and joint probability functions of mutually correlated positions), or as pseudogenes containing stop codons or frameshift mutations (<xref ref-type="bibr" rid="B39">39</xref>, <xref ref-type="bibr" rid="B68">68</xref>). The &#x3b1; locus contained 64 TRAJ genes, with 7 classified as ORF lacking the conventional &#x201c;W/FG.G&#x201d; amino acid motif, or due to a low RIC score of the RSS.</p>
<p>The TCR &#x3b4; locus was nested between TRAJ and TRAV genes and contained 5&#xa0;V families, 2 TRDD genes, 2 TRDJ genes and a single TRDC gene. The TRDV1 family, consisting of 41 genes (including 3 pseudogenes), was the largest, while the TRDV2, TRDV3, TRDV4, and TRDV5 families comprised 3, 1, 9 and 3 members, respectively. All TRDV4 genes were ORFs lacking predicted L-PART1 sequences in proximity to the 5&#x2019; end. The non-conventional TCR &#x3b4;-like locus on chromosome 10 comprised a set of single VDJC genes with an IgH V-like VH&#x3b4; gene, classified ORF due to a low RIC score RSS and the lack of a corresponding L-PART1 sequence that, when spliced to the TRDVH1 gene, would lead to a functional signal peptide.</p>
<p>The TCR &#x3b2; locus, located on chromosome 1 spanning approximately 211 kb, exhibited fewer genes with a total of 16 TRBV genes, that were all functional (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table&#xa0;1</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Files 3, 4</bold>
</xref>). Those occurred in three families, ordered from 5&#x2019; to 3&#x2019;, with 11 TRBV1 genes followed by 3 TRBV2 genes and one TRBV3 gene, followed by a single D gene, 4 J genes and a single C gene. Additionally, downstream of the C gene, there was a single V gene (TRBV2-4) in an inverted orientation on the forward strand.</p>
<p>In comparison to the TCR &#x3b2; locus, the &#x3b3; locus on chromosome 2 was more densely packed, containing 53&#xa0;V genes in four families spread across ~109 kb (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table&#xa0;1</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Files 5, 6</bold>
</xref>). Notably, a higher proportion of pseudogenes (28% of V&#x3b3; genes) was identified in the &#x3b3; locus compared to the other TCR loci. Nine out of 15 pseudogenes were incomplete fragments of V genes with short stretches of sequence similarity and a predicted RSS, leading to a low-confidence assignment to a specific V gene family. Most members of the TRGV1 family encoded a single-exon leader peptide, mirroring the structure seen in TRAV1 genes. However, their likelihood of containing functional signal peptides was low, as predicted by <italic>SignalP 6.0</italic>. Consequently, they were classified as ORFs, unless additional defects were detected, prompting classification as pseudogenes. In sum, we detected 8 TRGV1 genes (with 2 pseudogenes), 27 TRGV2 genes (with 8 pseudogenes), 10 TRGV3 genes (no pseudogenes), 8 TRGV4 genes (with 5 pseudogenes), 3 TRGJ genes and 1 TRGC gene.</p>
</sec>
<sec id="s3_2">
<label>3.2</label>
<title>Evolutionary relationships</title>
<p>Next, we wanted to analyze the genomic landscape of the TCR loci. Dotplot analysis revealed long stretches of sequence repeats separated by insertions and deletions in all loci, a pattern that is consistent with an evolutionary history shaped by duplication of homology units (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4</bold>
</xref>) (<xref ref-type="bibr" rid="B69">69</xref>). The regions of sequence similarity were much longer than the VDJ gene segments themselves and spanned across exons and non-coding sequences. We also detected inverted repeats in the TCR &#x3b2; locus. Overall, the TCR loci were low-complexity regions, with redundancy predominantly in genomic regions that contained V genes. Remarkably, repeats in the &#x3b1;/&#x3b4; locus were contained within regions of the same chain (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4A</bold>
</xref>). This separation indicated that sequence duplication events were constrained and occurred separately for each chain, or that inter-chain duplication events in this locus were more ancient.</p>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>Dotplots of TCR loci indicating long sequence repeats spanning exons and non-coding regions. The DNA sequence of each TCR locus was aligned against itself, indicating sequence repeats with dots and inverted repeats with red dots (minimum repeat length of 100 bp; repeat identity threshold of 100%). Linear locus representations with TCR gene annotations were included on the x axis for reference. Dotplots of the <bold>(A)</bold> TCR &#x3b1;/&#x3b4; locus, <bold>(B)</bold> TCR &#x3b2; locus, and <bold>(C)</bold> TCR &#x3b3; locus.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fimmu-15-1359169-g004.tif"/>
</fig>
<p>The overall landscape of repeats in the dotplot (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4</bold>
</xref>) reflected the topology of repeating units that could be observed in the genome locus representations (<xref ref-type="fig" rid="f1">
<bold>Figures&#xa0;1</bold>
</xref>&#x2013;<xref ref-type="fig" rid="f3">
<bold>3</bold>
</xref>). Across the &#x3b1; chain locus, pairs of TRAV1 and TRAV2 genes ~2 kb apart occurred repeatedly, with some variations in the pattern (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1</bold>
</xref>). In the dotplot, three clusters of &#x3b1; chain sequence repeats became apparent: a small cluster of repeats around the J genes, a larger cluster of repeats at ~400 - 650 kb with more V genes dispersed between TRAV1/TRAV2 pairs, and, although with some sequence overlap, a distinct cluster with more loosely arranged V genes (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4A</bold>
</xref>). The sequence repeats around the V&#x3b4; genes formed two clusters: A small cluster at ~310 - 380 kb, predominantly comprised of TRDV1 genes with three TRDV2 and one TRDV3 gene interspersed, and a larger cluster that also contained TRDV4 and TRDV5 family genes (<xref ref-type="fig" rid="f1">
<bold>Figures&#xa0;1</bold>
</xref>, <xref ref-type="fig" rid="f4">
<bold>4A</bold>
</xref>). The repeats around the V&#x3b2; genes were separated in two clusters by family, indicating separate evolution of TRBV genes by duplication of homology units and/or early separation from a common ancestral sequence (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4B</bold>
</xref>). In the TCR &#x3b3; locus, long stretches of homology units occurred up to 5 times, and a pattern of repeating units of TRGV4 - TRGV1 - TRGV3 - TRGV2 (1 to 5 TRGV2 genes) with some variations was observed, in agreement with previous reports (<xref ref-type="fig" rid="f3">
<bold>Figures&#xa0;3</bold>
</xref>, <xref ref-type="fig" rid="f4">
<bold>4C</bold>
</xref>) (<xref ref-type="bibr" rid="B22">22</xref>, <xref ref-type="bibr" rid="B23">23</xref>).</p>
<p>Next, we constructed a Maximum Likelihood tree of all F and ORF V genes to characterize the evolutionary relationship between V genes of different TCR loci (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5</bold>
</xref>). Reliability of the tree was estimated with the bootstrap method (500 bootstrap replicates). Notably, V sequences separated according to the chain type, except for all three TRDV5 sequences that clustered with the TRA genes and formed a distinct clade with the single TRAV3 gene. In addition, the single TRDVH1 gene from chromosome 10 was quite distinct from TRDV1-4 genes. Overall, the tree supported V family classification, as V families were separated in distinct clades. Members of any given V family shared a high degree of sequence similarity, leading to short branch lengths and poor tree resolution. To better highlight the topology of the tree at the branch tips, unscaled representations of the phylogenetic tree were constructed, with specific nodes collapsed (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure&#xa0;3</bold>
</xref>).</p>
<fig id="f5" position="float">
<label>Figure&#xa0;5</label>
<caption>
<p>Phylogenetic tree of chicken TRV genes. An unrooted Maximum Likelihood Tree displaying F and ORF TRV genes. Gene names at branch tips were replaced with their respective gene family names and counts in parentheses for improved readability.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fimmu-15-1359169-g005.tif"/>
</fig>
</sec>
<sec id="s3_3">
<label>3.3</label>
<title>The splenic TCR repertoire</title>
<p>With a complete genome annotation of VDJC gene segments at hand, our goal was to establish an approach for amplification and annotation of the expressed TCR repertoire in chickens. We based our method on a protocol described by Mamedov et&#xa0;al. for 5&#x2019;RACE with C gene-specific reverse primers and subsequent amplification of TCR sequences by two rounds of PCR (<xref ref-type="bibr" rid="B31">31</xref>, <xref ref-type="bibr" rid="B54">54</xref>). New chicken-specific reverse primer sets were established, and a UMI was included in the template switch oligo (TSO = <italic>&#x201c;SmartNNNNa&#x201d;</italic>) (<xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>). This molecular barcoding of the cDNA enabled deconvolution of PCR copies and duplicates of expressed cDNA during subsequent bioinformatic analysis, leading to more precise quantification.</p>
<p>Next, we wanted to characterize the TCR repertoire in the chicken spleen, as a proof of concept, and to collect baseline data on the TCR diversity in this major lymphoid organ. We amplified TCR sequences from splenic total RNA of three chickens and sequenced purified amplicons with a read length of 2x300 bp. Raw sequences were then analyzed with <italic>MiXCR</italic> (<xref ref-type="bibr" rid="B57">57</xref>). As a reference for automated alignment and clonotype assembly of TCR sequences by <italic>MiXCR</italic>, a custom chicken V(D)J library was created from all F and ORF genes annotated in this study. Anchor points that delineate CDR1-CDR3 and surrounding FR were specified for each gene. The CDR3 was defined as the target region in <italic>MiXCR</italic> due to its high sequence variability and its critical role in peptide binding. After processing in <italic>MiXCR</italic>, high-level downstream analysis of 4,000 - 10,000 clonotypes (after downsampling) per chain was performed in <italic>Python</italic> (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figures&#xa0;4A&#x2013;D</bold>
</xref>). The repertoires of each chain were predominantly comprised of unique nucleotide clonotypes that were only represented by a single cDNA molecule in the analyzed pool (only a single UMI barcode per clonotype that passed the reads per UMI thresholds in MiXCR), with some clonotypes exhibiting higher UMI per clonotype counts (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figures&#xa0;4E&#x2013;H</bold>
</xref>). For each chain, we analyzed V(D)J gene and gene family usage, CDR3 spectratypes, clonotype rank abundance, publicity, top clonotype sharing and CDR3 amino acid usage.</p>
<p>Strikingly, despite a lower count of TRAV2 genes in the genome (23&#xa0;F and ORF genes vs. 36 TRAV1), &#x3b1;&#x3b2; T cells in the spleen predominantly expressed TRAV2 genes (&gt; 90%), while TRAV1 genes and the single TRAV3 gene were detected at very low frequency (<xref ref-type="fig" rid="f6">
<bold>Figures&#xa0;6A, C</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure&#xa0;5A</bold>
</xref>). This contradicted a simple positive correlation between gene count and gene expression, indicating that other regulatory mechanisms likely contributed to this strong V gene expression bias. One such regulatory factor could be the RSS sequence, since a high proportion of TRAV1 genes were ORFs with a low RIC score RSS (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table&#xa0;1</bold>
</xref>). Individual TRDV1 and TRDV2 genes formed V &#x3b1;/&#x3b4; chimeric receptors with TCR &#x3b1; genes, as was previously reported by Liu et&#xa0;al., with chimeric receptors detected at very low frequency in all three samples (<xref ref-type="fig" rid="f6">
<bold>Figures&#xa0;6A, C</bold>
</xref>). J gene utilization also strongly favored specific J genes, of which TRAJ25 and TRAJ6 had the highest number of transcripts (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6B</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure&#xa0;6A</bold>
</xref>). The combinations of VJ segments with the highest expression were TRAV2-22 - TRAJ6 and TRAV2-3 - TRAJ25 (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6D</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure&#xa0;7</bold>
</xref>). The TCR &#x3b1; CDR3 spectratype was calculated and showed a Gaussian-like distribution (centered at 14 - 15 amino acids) indicative of an unbiased TCR repertoire without dominant clonally expanded clonotypes (<xref ref-type="bibr" rid="B18">18</xref>, <xref ref-type="bibr" rid="B70">70</xref>, <xref ref-type="bibr" rid="B71">71</xref>) (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6E</bold>
</xref>). The phenotype of an unbiased repertoire was reinforced by the distribution of clonotype index groups based on their relative frequencies, wherein all clonotypes within the TCR repertoire were ranked by abundance and grouped according to their indices (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6F</bold>
</xref>). The analysis revealed that the highest-ranked clonotypes accounted for a minor fraction of the overall repertoire. Furthermore, the color-coded TCR spectratypes representing the proportions of the top 10 most prevalent V genes (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figures&#xa0;8A&#x2013;C</bold>
</xref>) exhibited distributions typical of unbiased repertoires. Roughly 10% of the TCR &#x3b1; repertoire was occupied by &#x201c;public&#x201d; clonotypes (present in all three samples), ~5-10% by clonotypes expressed in 2 samples and &gt;80% were &#x201c;private&#x201d; TCR clonotypes (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6G</bold>
</xref>). Interestingly, the majority of the top 10 clonotypes in each sample were also present at similar frequencies in the two other samples (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figures&#xa0;9A&#x2013;C</bold>
</xref>). None of the clonotypes exhibited expansion beyond 0.5% of the repertoire. Converging CDR3s, representing distinct nucleic acid sequences encoding identical CDR3 amino acid sequences, constituted approximately 20% of the TCR &#x3b1; repertoire (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figures&#xa0;10A, B</bold>
</xref>). A maximum of 12 distinct sequences encoding the same CDR3 were identified, serving as a potential biomarker for antigen-specific T cell responses (<xref ref-type="bibr" rid="B72">72</xref>). The amino acid composition of the CDR3 showed that Glycine and Alanine were most prevalent, with an overall high proportion of polar neutral amino acids, and low frequencies of acidic and alkaline amino acids (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6H</bold>
</xref>).</p>
<fig id="f6" position="float">
<label>Figure&#xa0;6</label>
<caption>
<p>The TCR &#x3b1; chain repertoire expressed in the chicken spleen. TCR &#x3b1; chain amplicons were sequenced at 2x300 bp, followed by alignment and clonotype assembly using <italic>MiXCR</italic> software with a VDJ germline library comprised of the sequences annotated in this study. <bold>(A)</bold> Clustermap displaying V gene utilization for each sample featuring gene counts and color-coded relative frequencies in the heatmap. Row colors denote V family: green (TRAV1), yellow (TRAV2), red (TRAV3), grey (non-TRA V gene). <bold>(B)</bold> Clustermap displaying J gene utilization for each sample featuring gene counts and color-coded relative frequencies in the heatmap. <bold>(C)</bold> Log count of TCR clonotypes grouped by V family in the TCR &#x3b1; chain repertoire. <bold>(D)</bold> Bubble grid plot illustrating relative frequencies of V-J pairings, indicated by bubble size and color-coding. <bold>(E)</bold> CDR3 spectratype displaying the distribution of CDR3 amino acid lengths with frequency-weighted counts. <bold>(F)</bold> Rank abundance plot depicting the proportion of the TCR repertoire occupied by clonotype groups arranged by clonotype abundance rank. <bold>(G)</bold> Proportional abundance of clonotypes categorized by their prevalence across three samples. <bold>(H)</bold> Barplot showing mean counts of individual amino acids in the CDR3. <bold>(C, H)</bold> Mean &#xb1; 95% confidence intervals; means not sharing any letter are significantly different by the Tukey test at the 5% level of significance.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fimmu-15-1359169-g006.tif"/>
</fig>
<p>The corresponding TCR &#x3b2; repertoire primarily consisted of around 80-90% TRBV1-family clonotypes, approximately 10-20% sequences derived from TRBV2, and a minority of TCRs featuring the TRBV3-1 gene (<xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7C</bold>
</xref>). In the observed T cell repertoire, the most frequently utilized V and J genes were TRBV1-8, TRBV1-10, TRBJ3 and TRBJ1, with high expression levels across all J genes (<xref ref-type="fig" rid="f7">
<bold>Figures&#xa0;7A, B</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figures&#xa0;5B, 6B</bold>
</xref>). TRBV1-8 was predominantly paired with TRBJ1 (<xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7D</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure&#xa0;11</bold>
</xref>). The repertoire was unbiased with no preferentially expanded clones (&#x2265;0.5% as defined by Dascalu et&#xa0;al.) and a low degree of convergence (<xref ref-type="fig" rid="f7">
<bold>Figures&#xa0;7E, F</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figures&#xa0;8D&#x2013;F, 9D&#x2013;F, 10C&#x2013;D</bold>
</xref>) (<xref ref-type="bibr" rid="B29">29</xref>). The ranked clonotype abundance distribution closely mirrored the clonal homeostasis proportions reported by Dascalu et&#xa0;al. for the spleen, indicative of a large proportion of na&#xef;ve T cells (<xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7F</bold>
</xref>). Minimal overlap was observed among the top 10 most prevalent clonotypes when compared across the other two samples and virtually all clonotypes were private (<xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7G</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figures&#xa0;9D&#x2013;F</bold>
</xref>). The amino acid distribution in the CDR3 was overall comparable to &#x3b1; chain CDR3s, with some variation, including a higher proportion of Isoleucine (I), Asparagine (N) and Arginine (R), and relatively fewer Valine (V), Serine (S) and Threonine (T) residues (<xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7H</bold>
</xref>).</p>
<fig id="f7" position="float">
<label>Figure&#xa0;7</label>
<caption>
<p>The TCR &#x3b2; chain repertoire expressed in the chicken spleen. TCR &#x3b2; chain amplicons were sequenced at 2x300 bp, followed by alignment and clonotype assembly using <italic>MiXCR</italic> software with a VDJ germline library comprised of the sequences annotated in this study. <bold>(A)</bold> Clustermap displaying V gene utilization for each sample featuring gene counts and color-coded relative frequencies in the heatmap. Row colors denote V family: green (TRBV1), yellow (TRBV2), red (TRBV3). <bold>(B)</bold> Clustermap displaying J gene utilization for each sample featuring gene counts and color-coded relative frequencies in the heatmap. <bold>(C)</bold> Log count of TCR clonotypes grouped by V family in the TCR &#x3b2; chain repertoire. <bold>(D)</bold> Bubble grid plot illustrating relative frequencies of V-J pairings, indicated by bubble size and color-coding. <bold>(E)</bold> CDR3 spectratype displaying the distribution of CDR3 amino acid lengths with frequency-weighted counts. <bold>(F)</bold> Rank abundance plot depicting the proportion of the TCR repertoire occupied by clonotype groups that were categorized based on clonotype abundance rank. <bold>(G)</bold> Proportional abundance of clonotypes categorized by their prevalence across three samples. <bold>(H)</bold> Barplot showing mean counts of individual amino acids in the CDR3. <bold>(C, H)</bold> Mean &#xb1; 95% confidence intervals; means not sharing any letter are significantly different by the Tukey test at the 5% level of significance.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fimmu-15-1359169-g007.tif"/>
</fig>
<p>The TCR &#x3b3; repertoire displayed a distinct hierarchical pattern in gene utilization, featuring infrequent TCRs from TRGV1 and TRGV4, moderate levels of TRGV2-derived sequences, and a high frequency (60 - 80%) of clonotypes originating from TRGV3 family V genes (<xref ref-type="fig" rid="f8">
<bold>Figures&#xa0;8A, C</bold>
</xref>). Similarly, TRGJ1, TRGJ2 and TRGJ3 exhibited analogous trends, with mean frequencies of 1.6%, 34.8% and 63.6%, respectively (<xref ref-type="fig" rid="f8">
<bold>Figure&#xa0;8B</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure&#xa0;6C</bold>
</xref>). The most frequently expressed V&#x3b3; genes were TRGV2-26, TRGV3-6, and TRGV3-5, each predominantly paired with TRGJ3 (<xref ref-type="fig" rid="f8">
<bold>Figures&#xa0;8A, D</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figures&#xa0;5C, 12</bold>
</xref>). The CDR3 spectratype resembled an unbiased repertoire with a Gaussian-like distribution, featuring a long tail of low-frequency &#x201c;ultralong&#x201d; CDR3&#x3b3;s, as previously described by Zhang et&#xa0;al. (<xref ref-type="fig" rid="f8">
<bold>Figure&#xa0;8E</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figures&#xa0;8G&#x2013;I</bold>
</xref>) (<xref ref-type="bibr" rid="B23">23</xref>). The top 10 clonotypes collectively represented approximately 2 - 2.5% of the TCRs. Individual clonotypes were moderately expanded, occupying up to 0.63% of the repertoire space. The relative frequency of the most frequent clonotypes was strikingly similar across all three samples (<xref ref-type="fig" rid="f8">
<bold>Figure&#xa0;8F</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figures&#xa0;9G&#x2013;I</bold>
</xref>). The distribution of public and private clonotypes mirrored that of the TCR &#x3b1; sequences, comprising 10% found across three samples, while ~80% were private TCRs (<xref ref-type="fig" rid="f8">
<bold>Figure&#xa0;8G</bold>
</xref>). A substantial level of convergence was evident, with up to 13 distinct clonotypes encoding identical CDR3 sequences, accompanied by a notable publicness among convergent clonotypes (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figures&#xa0;10E, F</bold>
</xref>). The CDR3 amino acid utilization was strongly biased towards tyrosine residues, representing 23.9% of all amino acids in &#x3b3; chain TCRs (<xref ref-type="fig" rid="f8">
<bold>Figure&#xa0;8H</bold>
</xref>).</p>
<fig id="f8" position="float">
<label>Figure&#xa0;8</label>
<caption>
<p>The TCR &#x3b3; chain repertoire expressed in the chicken spleen. TCR &#x3b3; chain amplicons were sequenced at 2x300 bp, followed by alignment and clonotype assembly using <italic>MiXCR</italic> software with a VDJ germline library comprised of the sequences annotated in this study. <bold>(A)</bold> Clustermap displaying V gene utilization for each sample featuring gene counts and color-coded relative frequencies in the heatmap. Row colors denote V family: green (TRGV1), yellow (TRGV2), red (TRGV3), blue (TRGV4). <bold>(B)</bold> Clustermap displaying J gene utilization for each sample featuring gene counts and color-coded relative frequencies in the heatmap. <bold>(C)</bold> Log count of TCR clonotypes grouped by V family in the TCR &#x3b3; chain repertoire. <bold>(D)</bold> Bubble grid plot illustrating relative frequencies of V-J pairings, indicated by bubble size and color-coding. <bold>(E)</bold> CDR3 spectratype displaying the distribution of CDR3 amino acid lengths with frequency-weighted counts. <bold>(F)</bold> Rank abundance plot depicting the proportion of the TCR repertoire occupied by clonotype groups arranged by clonotype abundance rank. <bold>(G)</bold> Proportional abundance of clonotypes categorized by their prevalence across three samples. <bold>(H)</bold> Barplot showing mean counts of individual amino acids in the CDR3. <bold>(C, H)</bold> Mean &#xb1; 95% confidence intervals; means not sharing any letter are significantly different by the Tukey test at the 5% level of significance.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fimmu-15-1359169-g008.tif"/>
</fig>
<p>Various V gene families contributed to TCR &#x3b4; sequences, with high expression of TRDV1-derived sequences, intermediate levels of TRDV2-family TCRs and infrequent expression of TRDV3, TRDV4 and TRDV5 (<xref ref-type="fig" rid="f9">
<bold>Figures&#xa0;9A, C</bold>
</xref>). Notably, approximately every 4<sup>th</sup> - 5<sup>th</sup> TCR was a chimeric receptor formed by somatic DNA recombination of TCR &#x3b4; DJ-C genes with TRAV1, TRAV2 or TRAV3 V genes. In this dataset, 28 V&#x3b1; genes contributed to the TCR &#x3b4; repertoire (<xref ref-type="fig" rid="f9">
<bold>Figure&#xa0;9D</bold>
</xref>). Top V genes TRDV1-25 and TRDV1-11 were predominantly recombined to TRDJ1 (<xref ref-type="fig" rid="f9">
<bold>Figures&#xa0;9A, B, D</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figures&#xa0;5D, 6D, 13</bold>
</xref>). Similar to the other chains, the TCR &#x3b4; repertoire was phenotypically unbiased with no dominant clonotypes (<xref ref-type="fig" rid="f9">
<bold>Figures&#xa0;9E, F</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figures&#xa0;8J&#x2013;L, 9J&#x2013;L</bold>
</xref>). The CDR3 regions were longer in &#x3b4; chain TCRs (distribution centered at 16-17 amino acids) and most clonotypes were private with low convergence levels (<xref ref-type="fig" rid="f9">
<bold>Figures&#xa0;9E, G</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figures&#xa0;10G, H</bold>
</xref>). Unlike in the &#x3b3; chain CDR3, the tyrosine content in TCR &#x3b4; CDR3s was low, indicating that the two chains each contribute different binding properties to the CDR3 peptide binding groove in many &#x3b3;&#x3b4; TCRs (<xref ref-type="fig" rid="f9">
<bold>Figure&#xa0;9H</bold>
</xref>). Our analysis pipeline consistently delivered reproducible results across three biological replicates for all TCR chains.</p>
<fig id="f9" position="float">
<label>Figure&#xa0;9</label>
<caption>
<p>The TCR &#x3b4; chain repertoire expressed in the chicken spleen. TCR &#x3b4; chain amplicons were sequenced at 2x300 bp, followed by alignment and clonotype assembly using <italic>MiXCR</italic> software with a VDJ germline library comprised of the sequences annotated in this study. <bold>(A)</bold> Clustermap displaying V gene utilization for each sample featuring gene counts and color-coded relative frequencies in the heatmap. Row colors denote V family: green (TRDV1), yellow (TRDV2), red (TRDV3), blue (TRDV4), orange (TRDV5), grey (non-TRD V gene). <bold>(B)</bold> Clustermap displaying J gene utilization for each sample featuring gene counts and color-coded relative frequencies in the heatmap. <bold>(C)</bold> Log count of TCR clonotypes grouped by V family in the TCR &#x3b4; chain repertoire. <bold>(D)</bold> Bubble grid plot illustrating relative frequencies of V-J pairings, indicated by bubble size and color-coding. <bold>(E)</bold> CDR3 spectratype displaying the distribution of CDR3 amino acid lengths with frequency-weighted counts. <bold>(F)</bold> Rank abundance plot depicting the proportion of the TCR repertoire occupied by clonotype groups arranged by clonotype abundance rank. <bold>(G)</bold> Proportional abundance of clonotypes categorized by their prevalence across three samples. <bold>(H)</bold> Barplot showing mean counts of individual amino acids in the CDR3. <bold>(C, H)</bold> Mean &#xb1; 95% confidence intervals; means not sharing any letter are significantly different by the Tukey test at the 5% level of significance.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fimmu-15-1359169-g009.tif"/>
</fig>
<p>In summary, we delineated fundamental traits of the unbiased &#x3b1;&#x3b2; and &#x3b3;&#x3b4; T cell repertoires in the chicken spleen. The analysis encompassing the chicken TCR V(D)J germline genes along with the corresponding expressed TCR sequences has, for the first time, been comprehensively established across all four TCR chains. Our findings lay the groundwork for further investigations that will elucidate chicken T cell functions in infection and immunity.</p>
</sec>
</sec>
<sec id="s4" sec-type="discussion">
<label>4</label>
<title>Discussion</title>
<p>TCR repertoire sequencing, in conjunction with advances in NGS technology, has emerged as a key for understanding T cell biology and the dynamic composition of the T cell population. Most human repertoire studies focused on &#x3b1;&#x3b2; T cells, because &#x3b3;&#x3b4; T cells are present at low frequencies in the peripheral blood and other tissues. Specifically, the &#x3b2; chain CDR3 is the main target of human repertoire sequencing projects due to its high combinatorial diversity and important role in peptide binding (<xref ref-type="bibr" rid="B73">73</xref>). Considering the high frequency of &#x3b3;&#x3b4; T cells and the overall poorly characterized T cell responses in chickens, we concluded that an approach encompassing both &#x3b1;&#x3b2; and &#x3b3;&#x3b4; T cell repertoires is essential. This comprehensive analysis is crucial for addressing questions regarding the roles of chicken T cells in homeostasis, vaccination, and infection. However, this analysis has been hampered by a lack of publicly available annotations for TCR &#x3b1;/&#x3b4; V(D)J sequences.</p>
<p>To address this gap in knowledge, we established a comprehensive and standardized annotation across all TCR loci in the high-quality Huxu chicken genome assembly, including the TCR &#x3b1;/&#x3b4; hybrid locus on chromosome 27 (<xref ref-type="fig" rid="f1">
<bold>Figures&#xa0;1</bold>
</xref>&#x2013;<xref ref-type="fig" rid="f3">
<bold>3</bold>
</xref>) (<xref ref-type="bibr" rid="B34">34</xref>). We initially attempted to annotate the TCR loci in the current reference genomes <italic>bGalGal1.mat.broiler.GRCg7b</italic> and <italic>bGalGal1.pat.whiteleghornlayer.GRCg7w_WZ</italic> (two haplotypes of a cross between a modern broiler breeder mother and White Leghorn father), but noticed that the TCR sequences on chromosome 27 appeared to be incorrectly distributed between the two haplotypes (data not shown). In need of a tool to quickly assess the TCR loci in alternative genomes, we developed <italic>VJ-gene-finder</italic>, enabling automated VJ gene extraction. With an increasing number of new high-quality genomes being released for various chicken breeds, this tool represents a significant step towards an efficient and reproducible annotation of chicken TCR V(D)J genes across genomic datasets (between January and November 2023, 7 new genome assemblies were published on NCBI: <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/datasets/genome/?taxon=9031">https://www.ncbi.nlm.nih.gov/datasets/genome/?taxon=9031</ext-link>).</p>
<p>
<italic>VJ-gene-finder</italic> (v0.1) identified 97% of F&amp;ORF V genes and 91% of all F&amp;ORF J genes that were characterized as part of this study. Yet, <italic>VJ-gene-finder</italic> lacks functionality for identification of D genes and pseudogenes. With the chicken genome bearing only three known D genes (1 TRBD and 2 TRDD genes), however, manual annotation is straightforward. Annotation of pseudogenes, on the other hand, is not strictly required for TCR analysis since pseudogenes lack essential features and do not contribute to the expressed repertoire. We manually curated <italic>VJ-gene-finder</italic> results, which involved removing unspecific hits outside of the TCR loci, refining the start and end positions of genes and associated features, and classifying functionality. Insights gained from the annotation process will guide potential iterations of <italic>VJ-gene-finder</italic>, facilitating its further development and refinement. The current algorithm was specifically designed for chicken TCR sequences. However, the search criteria rely on broadly conserved features across species and can be readily adapted for diverse species. For this purpose, <italic>VJ-gene-finder</italic> is now freely available as open-source software.</p>
<p>This work offers crucial insights into chicken TCR loci. Additionally, we present a comprehensive report on our chicken-specific TCR repertoire pipeline, including the repertoire in the spleen. We incorporated molecular barcoding in our pipeline for more precise quantification of the expressed TCR chains. Collectively, this study will lay the foundation for future TCR repertoire analyses in chickens, facilitating systematic comparisons across tissues and chicken breeds (such as broiler and layer chickens), as well as the exploration of repertoire dynamics during infection.</p>
<p>The V(D)JC annotation outlined in this study extends beyond previous annotations of the TCR &#x3b1;/&#x3b4; locus (<xref ref-type="bibr" rid="B14">14</xref>, <xref ref-type="bibr" rid="B19">19</xref>). Genome annotation results can vary based on genome quality and annotation methods. Given the rapid advancements in these domains, this discussion focuses on more recent studies. Parra and Miller annotated the chicken TCR &#x3b1;/&#x3b4; locus in the red jungle fowl genome released in 2004 (<xref ref-type="bibr" rid="B14">14</xref>). They described 41 V&#x3b1;1 genes, 19 V&#x3b1;2 genes, 36 V&#x3b4;1 genes, 2 D&#x3b4; genes, 2 J&#x3b4; genes, and 48 J&#x3b1; genes within a ~800 kb locus on chromosome 27. Liu et&#xa0;al. sequenced BAC clones covering most of the TCR &#x3b1;/&#x3b4; locus and annotated VDJC genes, with gaps between BAC sequences filled using the <italic>galGal4</italic> genome. They detected 54 V&#x3b1; genes (10 families) and 31 V&#x3b4; genes (4 families), 2 D&#x3b4; genes, 2 J&#x3b4; genes and 67 J&#x3b1; genes in the ~800 kb locus. Unfortunately, both studies lacked a detailed map of gene positions in the reference sequence, and the VDJ sequences themselves were also not published. In comparison, the locus in the Huxu genome was larger, spanning almost 1000 kb, while the overall architecture was similar. Accordingly, the locus contained a higher number of V genes compared to previous reports by Parra and Miller, and Liu et&#xa0;al., with a total of 72 V&#x3b1; genes in three families and 57 V&#x3b4; genes in 5 families, and no major differences in J and D genes (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table&#xa0;1</bold>
</xref>). Liu et&#xa0;al. described two V&#x3b1; genes within the &#x3b4; locus, which likely correspond to TRDV5 family members in our annotation (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1</bold>
</xref>). The phylogenetic tree indicated that the sequences were evolutionarily more closely related to V&#x3b1; genes (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4</bold>
</xref>). However, despite the proximity, no expression of these genes was identified within the &#x3b1; repertoire, and the sequences were located within the &#x3b4; locus, prompting our classification of them as TRDV genes. To facilitate better comparability, comprehensive sequence information is provided in the <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Data</bold>
</xref> section.</p>
<p>A recent study by Zhang et&#xa0;al. characterized the TCR &#x3b2; locus in the red jungle fowl <italic>GRCg6a</italic> genome, reporting more V genes than existing annotations (<xref ref-type="bibr" rid="B18">18</xref>&#x2013;<xref ref-type="bibr" rid="B20">20</xref>). The genomic map of the TCR &#x3b2; locus in the Huxu genome closely resembled the locus structure reported by Zhang et&#xa0;al., with a total of 11 V&#x3b2;1 genes, 4 V&#x3b2;2 genes (one positioned downstream of the C gene in an inverted manner), 1 V&#x3b2;3 gene, 1 D&#x3b2; gene and 4 J&#x3b2; genes (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2</bold>
</xref>) (<xref ref-type="bibr" rid="B20">20</xref>). One V&#x3b2;1 gene was a pseudogene in the <italic>GRCg6a</italic> assembly, while all V&#x3b2; genes were functional in the Huxu genome. Zhang et&#xa0;al. named genes in ascending order away from the C gene. We propose to adhere to earlier conventions, naming the genes in 5&#x2019; - 3&#x2019; direction leading up to the C gene in the genomic organization (<xref ref-type="bibr" rid="B18">18</xref>, <xref ref-type="bibr" rid="B19">19</xref>, <xref ref-type="bibr" rid="B74">74</xref>). A comparative analysis of TCR &#x3b2; V(D)J sequences reported by Zhang et&#xa0;al. with those annotated in our study revealed complete nucleotide identity only in D and J genes, along with the V&#x3b2;3 gene (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table&#xa0;2</bold>
</xref>). Notably, direct pairwise comparisons between red jungle fowl genes and Huxu genes did not consistently result in a one-to-one match; some Huxu genes emerged as the best match multiple times, while others were never identified as the best match. This variability suggests variations in TCR genes between chicken lines.</p>
<p>Three recent studies published annotations of the TCR &#x3b3; locus, with varying numbers of V genes and families (<xref ref-type="bibr" rid="B19">19</xref>, <xref ref-type="bibr" rid="B22">22</xref>, <xref ref-type="bibr" rid="B23">23</xref>). Liu et&#xa0;al. reported 37 V&#x3b3; genes (11 families) based on BAC sequencing and the <italic>galGal4</italic> genome. The other two studies were both based on the <italic>GRCg6a</italic> genome assembly. Dixon et&#xa0;al. partially addressed a discrepancy concerning a potentially duplicated 15 kb sequence fragment containing 13&#xa0;V genes in the <italic>GRCg6a</italic> genome assembly, which seemed to have been excluded from the published annotation. This duplication was not discussed in the other study. Nonetheless, both studies reached similar conclusions regarding the number of TCR genes: Zhang et&#xa0;al. identified 44 V&#x3b3; genes in 6 distinct subgroups (<italic>GRCg6a</italic> genome), while Dixon et&#xa0;al. described 40 V&#x3b3; genes in 4 families. In this study, we characterized 53 V&#x3b3; genes, 9 of which were short remnant fragments with an RSS. Those would have likely been disregarded in other studies, leading to 44 remaining full-length V&#x3b3; genes organized in 4 families. These numbers overall align with previous work. In summary, multiple studies have provided consistent findings regarding the general organization of the locus, including the counts of D, J and C genes. However, discrepancies arise notably in the count of V genes. Comprehensive reporting of annotated sequences and the corresponding reference sequence becomes pivotal for facilitating direct comparisons among studies and, consequently, establishing a standardized nomenclature. For future comparative analyses, we conducted a comparison of TCR &#x3b3; V(D)J genes reported by Zhang et&#xa0;al. with those annotated in our study (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table&#xa0;3</bold>
</xref>). Similar to the TRB sequences, only J genes and some V genes exhibited 100% identity, and the sequences did not consistently match one-to-one in the red jungle fowl and Huxu genomes.</p>
<p>The evolutionary history of TCR loci is characterized by expansion, leading to diversification of the TCR repertoire. At the same time, evolutionary constraints lead to conserved sequences, residues and motifs that are essential for TCR genes, somatic DNA recombination, and the TCR structure. Those were the patterns that we aimed to identify with the search algorithm incorporated in <italic>VJ-gene-finder</italic>. The processes that shaped the evolution of TCR sequences likely were a complex combination of duplications, insertions, deletions, and gene conversion (<xref ref-type="bibr" rid="B69">69</xref>). The more distantly related genes in different V families and the highly similar sequences within gene families are an example of ancient and recent duplications. Overall, we found evidence for multiple duplications of specific homology units in all TCR loci.</p>
<p>In the TCR repertoire analyses of the spleen, several general patterns emerged. First, the repertoires in the spleen were predominantly unbiased with Gaussian-like spectratypes. Second, clonotypes were predominantly rare, with moderately expanded clonotypes (&lt;1% of the repertoire space) found in &#x3b3; repertoires, and, to a lesser degree, in &#x3b1; repertoires. Third, V and J gene utilization was strongly biased in all chains, except for TRBJ genes that were all commonly expressed in &#x3b2; chains. Several factors could contribute to variable expression, including the sequence of the RSS itself. Moreover, other sequence motifs in upstream noncoding regions of TCR genes, such as CRE and R-tract motifs, could control V gene expression (<xref ref-type="bibr" rid="B69">69</xref>). Observed biases in various tissues could also be a function of thymic positive and negative selection, differential homing properties and selective expansion upon tissue-specific stimuli. The fourth pattern was that chimeric receptors occurred frequently in the &#x3b4; repertoire and infrequently in the &#x3b1; repertoire. Fifth, a significant proportion of &#x3b3; and &#x3b1; clonotypes was public, while &#x3b2; and &#x3b4; (the D-gene containing chains) were predominantly private (at this sequencing depth). Sixth, the top 10 most frequent clonotypes occurred at similar frequencies in &#x3b1; and &#x3b3; repertoires, but not in &#x3b2; and &#x3b4; chains. In addition, rank abundance plots indicated that the top 100 clone groups occupied larger proportions of the &#x3b3; and &#x3b1; repertoires, pointing towards overall more (moderately) expanded clones. Several expanded clones, notably within the &#x3b3; repertoire, exhibited significant convergence, suggesting preferential selection of specific CDR3 amino acid sequences.</p>
<p>Finally, amino acids showed variable prevalence in CDR3s of each chain, with a striking bias towards tyrosine residues in &#x3b3; chains (<xref ref-type="fig" rid="f8">
<bold>Figure&#xa0;8H</bold>
</xref>). While tyrosine residues are not generally overrepresented in human and mouse &#x3b1;&#x3b2; TCR CDR3s, they are significantly enriched in immunoglobulin CDR3s. Specifically in murine CDR-H3s, the proportion of tyrosine residues reached 25%, akin to the relative frequency observed in chicken &#x3b3; chains (<xref ref-type="bibr" rid="B75">75</xref>&#x2013;<xref ref-type="bibr" rid="B77">77</xref>). This bias was attributed to the advantageous physicochemical properties of the tyrosine aromatic side chains, permitting flexible molecular interactions at the antigen binding sites (<xref ref-type="bibr" rid="B75">75</xref>, <xref ref-type="bibr" rid="B78">78</xref>). Consequently, a higher tyrosine content in CDR3s would facilitate binding of a wider range of (structurally diverse) ligands. This raises important questions about the nature of &#x3b3;&#x3b4; TCR ligands, which may or may not be restricted to peptide-MHCI/II complexes. Ultimately, conducting structural analysis of the chicken &#x3b3;&#x3b4; TCR, akin to the &#x3b1;&#x3b2; TCR, and identifying its ligands are essential steps towards analysing the antigen recognition of the &#x3b3;&#x3b4; TCR (<xref ref-type="bibr" rid="B10">10</xref>).</p>
<p>Overall, our repertoire analyses broadly align with previous studies, although care is warranted when direct comparisons are drawn due to inherent biases from differences in experimental design, chicken breeds, genome annotations, tissues and methodology used (<xref ref-type="bibr" rid="B20">20</xref>, <xref ref-type="bibr" rid="B22">22</xref>, <xref ref-type="bibr" rid="B23">23</xref>, <xref ref-type="bibr" rid="B29">29</xref>).</p>
<p>Several technical aspects need to be considered in the experimental design. We sequenced between 59172 and 131282 paired-end reads per sample and chain. The successful alignment rate in <italic>MiXCR</italic> varied between chains (from ~70% to &gt; 95%), with the lowest success in &#x3b1; chain sequences. Based on an initial analysis of unaligned reads, our preliminary hypothesis is that many non-regular TCR sequences containing introns and/or UTRs were amplified along with functional TCRs during 5&#x2019; RACE amplification. Since this is a known phenomenon, a dedicated computational tool for the analysis of irregular TCRs was developed, which aligns TCR sequences directly to the genome (<xref ref-type="bibr" rid="B79">79</xref>). In our analysis, we excluded non-regular TCRs because the functional relevance of such alternative transcripts is unclear. Furthermore, a notable portion of sequences exhibited stop codons (&#x2264;1% in &#x3b1; and &#x3b2; chains and &#x2264;5% in &#x3b3; and &#x3b4; chains) or frameshift mutations (&#x2264;8% in &#x3b1; and &#x3b2; chains and &#x2264;20% in &#x3b3; and &#x3b4; chains). We excluded such non-expressed TCRs in the post analysis. Together, these factors should be considered when estimating the desired sequencing depth. Notably, UMI-based PCR error correction is powerful, but a high sequencing coverage is required (<xref ref-type="bibr" rid="B80">80</xref>).</p>
<p>Bulk TCR repertoire analysis, as described here, represents a fast, accurate and powerful method for conducting an in-depth characterization of T cell responses. Compared to emerging single-cell technologies, bulk TCR repertoire sequencing can be used to sequence very deeply for the analysis of low-frequency clones, but the pairing of &#x3b1;&#x3b2; and &#x3b3;&#x3b4; chains can only be inferred. Regardless of single-cell or bulk analysis, of utmost importance will be to connect TCR sequence information to structural analysis and ligand identification. Studies focusing on antigen-specific responses will play a pivotal role in unravelling the roles of both &#x3b1;&#x3b2; and &#x3b3;&#x3b4; T cells within the adaptive immune responses of chickens.</p>
</sec>
<sec id="s5" sec-type="data-availability">
<title>Data availability statement</title>
<p>The original contributions presented in the study are publicly available. This data can be found here: [NCBI - PRJNA1068558].</p>
</sec>
<sec id="s6" sec-type="ethics-statement">
<title>Ethics statement</title>
<p>The animal study was approved by Government of Upper Bavaria, identification code: 55.2-1-54-2532.0-60-2015; June, 2019. The study was conducted in accordance with the local legislation and institutional requirements.</p>
</sec>
<sec id="s7" sec-type="author-contributions">
<title>Author contributions</title>
<p>SF: Conceptualization, Data curation, Formal analysis, Investigation, Methodology, Validation, Visualization, Writing &#x2013; original draft, Writing &#x2013; review &amp; editing. MF: Software, Writing &#x2013; review &amp; editing. BK: Funding acquisition, Project administration, Resources, Supervision, Writing &#x2013; review &amp; editing. TG: Conceptualization, Funding acquisition, Project administration, Resources, Supervision, Writing &#x2013; review &amp; editing.</p>
</sec>
</body>
<back>
<sec id="s8" sec-type="funding-information">
<title>Funding</title>
<p>The author(s) declare that financial support was received for the research, authorship, and/or publication of this article. This project was funded by the Deutsche Forschungsgemeinschaft (DFG, German Research Foundation) in the framework of the Research Unit ImmunoChick (FOR5130) through the central ImmunoChick funds (KA 3492/10-1) and the projects KA 3492/9-1 and GO 489/7-1 awarded to BK and TG.</p>
</sec>
<ack>
<title>Acknowledgments</title>
<p>The authors would like to thank Prof. Bernd Kaspers for his support. The authors would also like to thank Anna Hegele for her contributions. ChatGPT (<ext-link ext-link-type="uri" xlink:href="https://chat.openai.com/">https://chat.openai.com/</ext-link>) was used to improve conciseness of language, with no contribution to the scientific content.</p>
</ack>
<sec id="s9" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s10" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s11" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fimmu.2024.1359169/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fimmu.2024.1359169/full#supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="DataSheet_1.csv" id="SF1" mimetype="text/csv"/>
<supplementary-material xlink:href="DataSheet_2.fasta" id="SF2" mimetype="text/x-fasta"/>
<supplementary-material xlink:href="DataSheet_3.csv" id="SF3" mimetype="text/csv"/>
<supplementary-material xlink:href="DataSheet_4.fasta" id="SF4" mimetype="text/x-fasta"/>
<supplementary-material xlink:href="DataSheet_5.csv" id="SF5" mimetype="text/csv"/>
<supplementary-material xlink:href="DataSheet_6.fasta" id="SF6" mimetype="text/x-fasta"/>
<supplementary-material xlink:href="DataSheet_7.zip" id="SM1" mimetype="application/zip"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<label>1</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sheridan</surname> <given-names>BS</given-names>
</name>
<name>
<surname>Romagnoli</surname> <given-names>PA</given-names>
</name>
<name>
<surname>Pham</surname> <given-names>Q-M</given-names>
</name>
<name>
<surname>Fu</surname> <given-names>H-H</given-names>
</name>
<name>
<surname>Alonzo</surname> <given-names>F</given-names>
</name>
<name>
<surname>Schubert</surname> <given-names>W-D</given-names>
</name>
<etal/>
</person-group>. <article-title>&#x3b3;&#x3b4; T cells exhibit multifunctional and protective memory in intestinal tissues</article-title>. <source>Immunity</source>. (<year>2013</year>) <volume>39</volume>:<page-range>184&#x2013;95</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.immuni.2013.06.015</pub-id>
</citation>
</ref>
<ref id="B2">
<label>2</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fenzl</surname> <given-names>L</given-names>
</name>
<name>
<surname>G&#xf6;bel</surname> <given-names>TW</given-names>
</name>
<name>
<surname>Neulen</surname> <given-names>M-L</given-names>
</name>
</person-group>. <article-title>&#x3b3;&#x3b4; T cells represent a major spontaneously cytotoxic cell population in the chicken</article-title>. <source>Dev Comp Immunol</source>. (<year>2017</year>) <volume>73</volume>:<page-range>175&#x2013;83</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.dci.2017.03.028</pub-id>
</citation>
</ref>
<ref id="B3">
<label>3</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ribot</surname> <given-names>JC</given-names>
</name>
<name>
<surname>Lopes</surname> <given-names>N</given-names>
</name>
<name>
<surname>Silva-Santos</surname> <given-names>B</given-names>
</name>
</person-group>. <article-title>&#x3b3;&#x3b4; T cells in tissue physiology and surveillance</article-title>. <source>Nat Rev Immunol</source>. (<year>2021</year>) <volume>21</volume>:<page-range>221&#x2013;32</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41577-020-00452-4</pub-id>
</citation>
</ref>
<ref id="B4">
<label>4</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname> <given-names>CL</given-names>
</name>
<name>
<surname>Cihak</surname> <given-names>J</given-names>
</name>
<name>
<surname>L&#xf6;sch</surname> <given-names>U</given-names>
</name>
<name>
<surname>Cooper</surname> <given-names>MD</given-names>
</name>
</person-group>. <article-title>Differential expression of two T cell receptors, TcR1 and TcR2, on chicken lymphocytes</article-title>. <source>Eur J Immunol</source>. (<year>1988</year>) <volume>18</volume>:<page-range>539&#x2013;43</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/eji.1830180408</pub-id>
</citation>
</ref>
<ref id="B5">
<label>5</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname> <given-names>CL</given-names>
</name>
<name>
<surname>Ager</surname> <given-names>LL</given-names>
</name>
<name>
<surname>Gartland</surname> <given-names>GL</given-names>
</name>
<name>
<surname>Cooper</surname> <given-names>MD</given-names>
</name>
</person-group>. <article-title>Identification of a T3/T cell receptor complex in chickens</article-title>. <source>J Exp Med</source>. (<year>1986</year>) <volume>164</volume>:<page-range>375&#x2013;80</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1084/jem.164.1.375</pub-id>
</citation>
</ref>
<ref id="B6">
<label>6</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chan</surname> <given-names>MM</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>CL</given-names>
</name>
<name>
<surname>Ager</surname> <given-names>LL</given-names>
</name>
<name>
<surname>Cooper</surname> <given-names>MD</given-names>
</name>
</person-group>. <article-title>Identification of the avian homologues of mammalian CD4 and CD8 antigens</article-title>. <source>J Immunol</source>. (<year>1988</year>) <volume>140</volume>:<page-range>2133&#x2013;8</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.4049/jimmunol.140.7.2133</pub-id>
</citation>
</ref>
<ref id="B7">
<label>7</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cihak</surname> <given-names>J</given-names>
</name>
<name>
<surname>Ziegler-Heitbrock</surname> <given-names>HWL</given-names>
</name>
<name>
<surname>Trainer</surname> <given-names>H</given-names>
</name>
<name>
<surname>Merkenschlager</surname> <given-names>M</given-names>
</name>
<name>
<surname>L&#xf6;sch</surname> <given-names>U</given-names>
</name>
</person-group>. <article-title>Characterization and functional properties of a novel monoclonal antibody which identifies a T cell receptor in chickens</article-title>. <source>Eur J Immunol</source>. (<year>1988</year>) <volume>18</volume>:<page-range>533&#x2013;8</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/eji.1830180407</pub-id>
</citation>
</ref>
<ref id="B8">
<label>8</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sowder</surname> <given-names>JT</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>CL</given-names>
</name>
<name>
<surname>Ager</surname> <given-names>LL</given-names>
</name>
<name>
<surname>Chan</surname> <given-names>MM</given-names>
</name>
<name>
<surname>Cooper</surname> <given-names>MD</given-names>
</name>
</person-group>. <article-title>A large subpopulation of avian T cells express a homologue of the mammalian T gamma/delta receptor</article-title>. <source>J Exp Med</source>. (<year>1988</year>) <volume>167</volume>:<page-range>315&#x2013;22</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1084/jem.167.2.315</pub-id>
</citation>
</ref>
<ref id="B9">
<label>9</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Char</surname> <given-names>D</given-names>
</name>
<name>
<surname>Sanchez</surname> <given-names>P</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>CL</given-names>
</name>
<name>
<surname>Bucy</surname> <given-names>RP</given-names>
</name>
<name>
<surname>Cooper</surname> <given-names>MD</given-names>
</name>
</person-group>. <article-title>A third sublineage of avian T cells can be identified with a T cell receptor-3-specific antibody</article-title>. <source>J Immunol</source>. (<year>1990</year>) <volume>145</volume>(<issue>11</issue>):<fpage>3547</fpage>&#x2013;<lpage>55</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.4049/jimmunol.145.11.3547</pub-id>
</citation>
</ref>
<ref id="B10">
<label>10</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>L</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Meng</surname> <given-names>G</given-names>
</name>
<name>
<surname>Liang</surname> <given-names>R</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>B</given-names>
</name>
<name>
<surname>Xia</surname> <given-names>C</given-names>
</name>
</person-group>. <article-title>Structural and biophysical insights into the TCR&#x3b1;&#x3b2; Complex in chickens</article-title>. <source>iScience</source>. (<year>2020</year>) <volume>23</volume>:<elocation-id>101828</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.isci.2020.101828</pub-id>
</citation>
</ref>
<ref id="B11">
<label>11</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lefranc</surname> <given-names>M-P</given-names>
</name>
<name>
<surname>Pommi&#xe9;</surname> <given-names>C</given-names>
</name>
<name>
<surname>Ruiz</surname> <given-names>M</given-names>
</name>
<name>
<surname>Giudicelli</surname> <given-names>V</given-names>
</name>
<name>
<surname>Foulquier</surname> <given-names>E</given-names>
</name>
<name>
<surname>Truong</surname> <given-names>L</given-names>
</name>
<etal/>
</person-group>. <article-title>IMGT unique numbering for immunoglobulin and T cell receptor variable domains and Ig superfamily V-like domains</article-title>. <source>Dev Comp Immunol</source>. (<year>2003</year>) <volume>27</volume>:<fpage>55</fpage>&#x2013;<lpage>77</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/S0145-305X(02)00039-3</pub-id>
</citation>
</ref>
<ref id="B12">
<label>12</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Schatz</surname> <given-names>DG</given-names>
</name>
<name>
<surname>Ji</surname> <given-names>Y</given-names>
</name>
</person-group>. <article-title>Recombination centres and the orchestration of V(D)J recombination</article-title>. <source>Nat Rev Immunol</source>. (<year>2011</year>) <volume>11</volume>:<page-range>251&#x2013;63</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nri2941</pub-id>
</citation>
</ref>
<ref id="B13">
<label>13</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>G&#xf6;bel</surname> <given-names>TW</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>CL</given-names>
</name>
<name>
<surname>Lahti</surname> <given-names>J</given-names>
</name>
<name>
<surname>Kubota</surname> <given-names>T</given-names>
</name>
<name>
<surname>Kuo</surname> <given-names>CL</given-names>
</name>
<name>
<surname>Aebersold</surname> <given-names>R</given-names>
</name>
<etal/>
</person-group>. <article-title>Identification of T-cell receptor alpha-chain genes in the chicken</article-title>. <source>Proc Natl Acad Sci USA</source>. (<year>1994</year>) <volume>91</volume>:<page-range>1094&#x2013;8</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.91.3.1094</pub-id>
</citation>
</ref>
<ref id="B14">
<label>14</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Parra</surname> <given-names>ZE</given-names>
</name>
<name>
<surname>Miller</surname> <given-names>RD</given-names>
</name>
</person-group>. <article-title>Comparative analysis of the chicken TCR&#x3b1;/&#x3b4; locus</article-title>. <source>Immunogenetics</source>. (<year>2012</year>) <volume>64</volume>:<page-range>641&#x2013;5</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s00251-012-0621-5</pub-id>
</citation>
</ref>
<ref id="B15">
<label>15</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rossjohn</surname> <given-names>J</given-names>
</name>
<name>
<surname>Gras</surname> <given-names>S</given-names>
</name>
<name>
<surname>Miles</surname> <given-names>JJ</given-names>
</name>
<name>
<surname>Turner</surname> <given-names>SJ</given-names>
</name>
<name>
<surname>Godfrey</surname> <given-names>DI</given-names>
</name>
<name>
<surname>McCluskey</surname> <given-names>J</given-names>
</name>
</person-group>. <article-title>T cell antigen receptor recognition of antigen-presenting molecules</article-title>. <source>Annu Rev Immunol</source>. (<year>2015</year>) <volume>33</volume>:<fpage>169</fpage>&#x2013;<lpage>200</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1146/annurev-immunol-032414-112334</pub-id>
</citation>
</ref>
<ref id="B16">
<label>16</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tjoelker</surname> <given-names>LW</given-names>
</name>
<name>
<surname>Carlson</surname> <given-names>LM</given-names>
</name>
<name>
<surname>Lee</surname> <given-names>K</given-names>
</name>
<name>
<surname>Lahti</surname> <given-names>J</given-names>
</name>
<name>
<surname>McCormack</surname> <given-names>WT</given-names>
</name>
<name>
<surname>Leiden</surname> <given-names>JM</given-names>
</name>
<etal/>
</person-group>. <article-title>Evolutionary conservation of antigen recognition: the chicken T-cell receptor beta chain</article-title>. <source>Proc Natl Acad Sci USA</source>. (<year>1990</year>) <volume>87</volume>:<page-range>7856&#x2013;60</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.87.20.7856</pub-id>
</citation>
</ref>
<ref id="B17">
<label>17</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lahti</surname> <given-names>JM</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>CL</given-names>
</name>
<name>
<surname>Tjoelker</surname> <given-names>LW</given-names>
</name>
<name>
<surname>Pickel</surname> <given-names>JM</given-names>
</name>
<name>
<surname>Schat</surname> <given-names>KA</given-names>
</name>
<name>
<surname>Calnek</surname> <given-names>BW</given-names>
</name>
<etal/>
</person-group>. <article-title>Two distinct alpha beta T-cell lineages can be distinguished by the differential usage of T-cell receptor V beta gene segments</article-title>. <source>Proc Natl Acad Sci USA</source>. (<year>1991</year>) <volume>88</volume>:<page-range>10956&#x2013;60</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.88.23.10956</pub-id>
</citation>
</ref>
<ref id="B18">
<label>18</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mwangi</surname> <given-names>WN</given-names>
</name>
<name>
<surname>Beal</surname> <given-names>RK</given-names>
</name>
<name>
<surname>Powers</surname> <given-names>C</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>X</given-names>
</name>
<name>
<surname>Humphrey</surname> <given-names>T</given-names>
</name>
<name>
<surname>Watson</surname> <given-names>M</given-names>
</name>
<etal/>
</person-group>. <article-title>Regional and global changes in TCR&#x3b1;&#x3b2; T cell repertoires in the gut are dependent upon the complexity of the enteric microflora</article-title>. <source>Dev Comp Immunol</source>. (<year>2010</year>) <volume>34</volume>:<page-range>406&#x2013;17</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.dci.2009.11.009</pub-id>
</citation>
</ref>
<ref id="B19">
<label>19</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname> <given-names>F</given-names>
</name>
<name>
<surname>Li</surname> <given-names>J</given-names>
</name>
<name>
<surname>Lin</surname> <given-names>IYC</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>X</given-names>
</name>
<name>
<surname>Ma</surname> <given-names>J</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>Y</given-names>
</name>
<etal/>
</person-group>. <article-title>The genome resequencing of TCR loci in Gallus gallus revealed their distinct evolutionary features in avians</article-title>. <source>ImmunoHorizons</source>. (<year>2020</year>) <volume>4</volume>:<fpage>33</fpage>&#x2013;<lpage>46</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.4049/immunohorizons.1900095</pub-id>
</citation>
</ref>
<ref id="B20">
<label>20</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>T</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>G</given-names>
</name>
<name>
<surname>Wei</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Kang</surname> <given-names>L</given-names>
</name>
<name>
<surname>Jiang</surname> <given-names>Y</given-names>
</name>
<etal/>
</person-group>. <article-title>Genomic organization of the chicken TCR&#x3b2; locus originated by duplication of a V&#x3b2; segment combined with a trypsinogen gene</article-title>. <source>Vet Immunol Immunopathol</source>. (<year>2020</year>) <volume>219</volume>:<elocation-id>109974</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.vetimm.2019.109974</pub-id>
</citation>
</ref>
<ref id="B21">
<label>21</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Six</surname> <given-names>A</given-names>
</name>
<name>
<surname>Rast</surname> <given-names>JP</given-names>
</name>
<name>
<surname>McCormack</surname> <given-names>WT</given-names>
</name>
<name>
<surname>Dunon</surname> <given-names>D</given-names>
</name>
<name>
<surname>Courtois</surname> <given-names>D</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Y</given-names>
</name>
<etal/>
</person-group>. <article-title>Characterization of avian T-cell receptor &#x3b3; genes</article-title>. <source>Proc Natl Acad Sci USA</source>. (<year>1996</year>) <volume>93</volume>:<page-range>15329&#x2013;34</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.93.26.15329</pub-id>
</citation>
</ref>
<ref id="B22">
<label>22</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dixon</surname> <given-names>R</given-names>
</name>
<name>
<surname>Preston</surname> <given-names>SG</given-names>
</name>
<name>
<surname>Dascalu</surname> <given-names>S</given-names>
</name>
<name>
<surname>Flammer</surname> <given-names>PG</given-names>
</name>
<name>
<surname>Fiddaman</surname> <given-names>SR</given-names>
</name>
<name>
<surname>McLoughlin</surname> <given-names>K</given-names>
</name>
<etal/>
</person-group>. <article-title>Repertoire analysis of &#x3b3;&#x3b4; T cells in the chicken enables functional annotation of the genomic region revealing highly variable pan-tissue TCR gamma V gene usage as well as identifying public and private repertoires</article-title>. <source>BMC Genomics</source>. (<year>2021</year>) <volume>22</volume>:<fpage>719</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12864-021-08036-9</pub-id>
</citation>
</ref>
<ref id="B23">
<label>23</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>T</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Q</given-names>
</name>
<name>
<surname>Li</surname> <given-names>X</given-names>
</name>
<name>
<surname>Kang</surname> <given-names>L</given-names>
</name>
<name>
<surname>Jiang</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Sun</surname> <given-names>Y</given-names>
</name>
</person-group>. <article-title>Characterization of the chicken T cell receptor &#x3b3; repertoire by high-throughput sequencing</article-title>. <source>BMC Genomics</source>. (<year>2021</year>) <volume>22</volume>:<fpage>683</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12864-021-07975-7</pub-id>
</citation>
</ref>
<ref id="B24">
<label>24</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kubota</surname> <given-names>T</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>J</given-names>
</name>
<name>
<surname>G&#xf6;bel</surname> <given-names>TW</given-names>
</name>
<name>
<surname>Hockett</surname> <given-names>RD</given-names>
</name>
<name>
<surname>Cooper</surname> <given-names>MD</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>CH</given-names>
</name>
</person-group>. <article-title>Characterization of an avian (Gallus gallus domesticus) TCR &#x3b1;&#x3b4; gene locus</article-title>. <source>J Immunol</source>. (<year>1999</year>) <volume>163</volume>:<page-range>3858&#x2013;66</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.4049/jimmunol.163.7.3858</pub-id>
</citation>
</ref>
<ref id="B25">
<label>25</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Parra</surname> <given-names>ZE</given-names>
</name>
<name>
<surname>Mitchell</surname> <given-names>K</given-names>
</name>
<name>
<surname>Dalloul</surname> <given-names>RA</given-names>
</name>
<name>
<surname>Miller</surname> <given-names>RD</given-names>
</name>
</person-group>. <article-title>A second TCR&#x3b4; Locus in galliformes uses antibody-like V domains: insight into the evolution of TCR&#x3b4; and TCR&#x3bc; Genes in tetrapods</article-title>. <source>J Immunol</source>. (<year>2012</year>) <volume>188</volume>:<page-range>3912&#x2013;9</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.4049/jimmunol.1103521</pub-id>
</citation>
</ref>
<ref id="B26">
<label>26</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lefranc</surname> <given-names>M-P</given-names>
</name>
</person-group>. <article-title>IMGT (ImMunoGeneTics) locus on focus. A new section of Experimental and Clinical Immunogenetics</article-title>. <source>Exp Clin Immunogenetics</source>. (<year>1998</year>) <volume>15</volume>:<fpage>1</fpage>&#x2013;<lpage>7</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1159/000019049</pub-id>
</citation>
</ref>
<ref id="B27">
<label>27</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Britanova</surname> <given-names>OV</given-names>
</name>
<name>
<surname>Putintseva</surname> <given-names>EV</given-names>
</name>
<name>
<surname>Shugay</surname> <given-names>M</given-names>
</name>
<name>
<surname>Merzlyak</surname> <given-names>EM</given-names>
</name>
<name>
<surname>Turchaninova</surname> <given-names>MA</given-names>
</name>
<name>
<surname>Staroverov</surname> <given-names>DB</given-names>
</name>
<etal/>
</person-group>. <article-title>Age-related decrease in TCR repertoire diversity measured with deep and normalized sequence profiling</article-title>. <source>J Immunol</source>. (<year>2014</year>) <volume>192</volume>:<page-range>2689&#x2013;98</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.4049/jimmunol.1302064</pub-id>
</citation>
</ref>
<ref id="B28">
<label>28</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Minervina</surname> <given-names>AA</given-names>
</name>
<name>
<surname>Pogorelyy</surname> <given-names>MV</given-names>
</name>
<name>
<surname>Komech</surname> <given-names>EA</given-names>
</name>
<name>
<surname>Karnaukhov</surname> <given-names>VK</given-names>
</name>
<name>
<surname>Bacher</surname> <given-names>P</given-names>
</name>
<name>
<surname>Rosati</surname> <given-names>E</given-names>
</name>
<etal/>
</person-group>. <article-title>Primary and secondary anti-viral response captured by the dynamics and phenotype of individual T cell clones</article-title>. <source>eLife</source>. (<year>2020</year>) <volume>9</volume>:<elocation-id>e53704</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.7554/eLife.53704</pub-id>
</citation>
</ref>
<ref id="B29">
<label>29</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dascalu</surname> <given-names>S</given-names>
</name>
<name>
<surname>Preston</surname> <given-names>SG</given-names>
</name>
<name>
<surname>Dixon</surname> <given-names>RJ</given-names>
</name>
<name>
<surname>Flammer</surname> <given-names>PG</given-names>
</name>
<name>
<surname>Fiddaman</surname> <given-names>S</given-names>
</name>
<name>
<surname>Boyd</surname> <given-names>A</given-names>
</name>
<etal/>
</person-group>. <article-title>The influences of microbial colonisation and germ-free status on the chicken TCR&#x3b2; repertoire</article-title>. <source>Front Immunol</source>. (<year>2023</year>) <volume>13</volume>:<elocation-id>1052297</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fimmu.2022.1052297</pub-id>
</citation>
</ref>
<ref id="B30">
<label>30</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kivioja</surname> <given-names>T</given-names>
</name>
<name>
<surname>V&#xe4;h&#xe4;rautio</surname> <given-names>A</given-names>
</name>
<name>
<surname>Karlsson</surname> <given-names>K</given-names>
</name>
<name>
<surname>Bonke</surname> <given-names>M</given-names>
</name>
<name>
<surname>Enge</surname> <given-names>M</given-names>
</name>
<name>
<surname>Linnarsson</surname> <given-names>S</given-names>
</name>
<etal/>
</person-group>. <article-title>Counting absolute numbers of molecules using unique molecular identifiers</article-title>. <source>Nat Methods</source>. (<year>2012</year>) <volume>9</volume>:<page-range>72&#x2013;4</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nmeth.1778</pub-id>
</citation>
</ref>
<ref id="B31">
<label>31</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mamedov</surname> <given-names>IZ</given-names>
</name>
<name>
<surname>Britanova</surname> <given-names>OV</given-names>
</name>
<name>
<surname>Zvyagin</surname> <given-names>IV</given-names>
</name>
<name>
<surname>Turchaninova</surname> <given-names>MA</given-names>
</name>
<name>
<surname>Bolotin</surname> <given-names>DA</given-names>
</name>
<name>
<surname>Putintseva</surname> <given-names>EV</given-names>
</name>
<etal/>
</person-group>. <article-title>Preparing unbiased T-cell receptor and antibody cDNA libraries for the deep next generation sequencing profiling</article-title>. <source>Front Immunol</source>. (<year>2013</year>) <volume>4</volume>:<elocation-id>456</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fimmu.2013.00456</pub-id>
</citation>
</ref>
<ref id="B32">
<label>32</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ye</surname> <given-names>J</given-names>
</name>
<name>
<surname>Coulouris</surname> <given-names>G</given-names>
</name>
<name>
<surname>Zaretskaya</surname> <given-names>I</given-names>
</name>
<name>
<surname>Cutcutache</surname> <given-names>I</given-names>
</name>
<name>
<surname>Rozen</surname> <given-names>S</given-names>
</name>
<name>
<surname>Madden</surname> <given-names>TL</given-names>
</name>
</person-group>. <article-title>Primer-BLAST: a tool to design target-specific primers for polymerase chain reaction</article-title>. <source>BMC Bioinf</source>. (<year>2012</year>) <volume>13</volume>:<elocation-id>134</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/1471-2105-13-134</pub-id>
</citation>
</ref>
<ref id="B33">
<label>33</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Olivieri</surname> <given-names>D</given-names>
</name>
<name>
<surname>Faro</surname> <given-names>J</given-names>
</name>
<name>
<surname>von Haeften</surname> <given-names>B</given-names>
</name>
<name>
<surname>S&#xe1;nchez-Espinel</surname> <given-names>C</given-names>
</name>
<name>
<surname>Gamb&#xf3;n-Deza</surname> <given-names>F</given-names>
</name>
</person-group>. <article-title>An automated algorithm for extracting functional immunologic V-genes from genomes in jawed vertebrates</article-title>. <source>Immunogenetics</source>. (<year>2013</year>) <volume>65</volume>:<fpage>691</fpage>&#x2013;<lpage>702</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s00251-013-0715-8</pub-id>
</citation>
</ref>
<ref id="B34">
<label>34</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Huang</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>Z</given-names>
</name>
<name>
<surname>Bai</surname> <given-names>H</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>Y</given-names>
</name>
<name>
<surname>Kang</surname> <given-names>N</given-names>
</name>
<name>
<surname>Ding</surname> <given-names>X</given-names>
</name>
<etal/>
</person-group>. <article-title>Evolutionary analysis of a complete chicken genome</article-title>. <source>Proc Natl Acad Sci USA</source>. (<year>2023</year>) <volume>120</volume>:<elocation-id>e2216641120</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.2216641120</pub-id>
</citation>
</ref>
<ref id="B35">
<label>35</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Larkin</surname> <given-names>MA</given-names>
</name>
<name>
<surname>Blackshields</surname> <given-names>G</given-names>
</name>
<name>
<surname>Brown</surname> <given-names>NP</given-names>
</name>
<name>
<surname>Chenna</surname> <given-names>R</given-names>
</name>
<name>
<surname>McGettigan</surname> <given-names>PA</given-names>
</name>
<name>
<surname>McWilliam</surname> <given-names>H</given-names>
</name>
<etal/>
</person-group>. <article-title>Clustal W and Clustal X version 2.0</article-title>. <source>Bioinformatics</source>. (<year>2007</year>) <volume>23</volume>:<page-range>2947&#x2013;8</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/btm404</pub-id>
</citation>
</ref>
<ref id="B36">
<label>36</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Waterhouse</surname> <given-names>AM</given-names>
</name>
<name>
<surname>Procter</surname> <given-names>JB</given-names>
</name>
<name>
<surname>Martin</surname> <given-names>DMA</given-names>
</name>
<name>
<surname>Clamp</surname> <given-names>M</given-names>
</name>
<name>
<surname>Barton</surname> <given-names>GJ</given-names>
</name>
</person-group>. <article-title>Jalview Version 2&#x2014;a multiple sequence alignment editor and analysis workbench</article-title>. <source>Bioinformatics</source>. (<year>2009</year>) <volume>25</volume>:<page-range>1189&#x2013;91</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/btp033</pub-id>
</citation>
</ref>
<ref id="B37">
<label>37</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sievers</surname> <given-names>F</given-names>
</name>
<name>
<surname>Wilm</surname> <given-names>A</given-names>
</name>
<name>
<surname>Dineen</surname> <given-names>D</given-names>
</name>
<name>
<surname>Gibson</surname> <given-names>TJ</given-names>
</name>
<name>
<surname>Karplus</surname> <given-names>K</given-names>
</name>
<name>
<surname>Li</surname> <given-names>W</given-names>
</name>
<etal/>
</person-group>. <article-title>Fast, scalable generation of high-quality protein multiple sequence alignments using Clustal Omega</article-title>. <source>Mol Syst Biol</source>. (<year>2011</year>) <volume>7</volume>:<fpage>539</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/msb.2011.75</pub-id>
</citation>
</ref>
<ref id="B38">
<label>38</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Carver</surname> <given-names>T</given-names>
</name>
<name>
<surname>Harris</surname> <given-names>SR</given-names>
</name>
<name>
<surname>Berriman</surname> <given-names>M</given-names>
</name>
<name>
<surname>Parkhill</surname> <given-names>J</given-names>
</name>
<name>
<surname>McQuillan</surname> <given-names>JA</given-names>
</name>
</person-group>. <article-title>Artemis: an integrated platform for visualization and analysis of high-throughput sequence-based experimental data</article-title>. <source>Bioinformatics</source>. (<year>2012</year>) <volume>28</volume>:<page-range>464&#x2013;9</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/btr703</pub-id>
</citation>
</ref>
<ref id="B39">
<label>39</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Merelli</surname> <given-names>I</given-names>
</name>
<name>
<surname>Guffanti</surname> <given-names>A</given-names>
</name>
<name>
<surname>Fabbri</surname> <given-names>M</given-names>
</name>
<name>
<surname>Cocito</surname> <given-names>A</given-names>
</name>
<name>
<surname>Furia</surname> <given-names>L</given-names>
</name>
<name>
<surname>Grazini</surname> <given-names>U</given-names>
</name>
<etal/>
</person-group>. <article-title>RSSsite: a reference database and prediction tool for the identification of cryptic Recombination Signal Sequences in human and murine genomes</article-title>. <source>Nucleic Acids Res</source>. (<year>2010</year>) <volume>38</volume>:<page-range>W262&#x2013;7</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/gkq391</pub-id>
</citation>
</ref>
<ref id="B40">
<label>40</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Scalzitti</surname> <given-names>N</given-names>
</name>
<name>
<surname>Kress</surname> <given-names>A</given-names>
</name>
<name>
<surname>Orhand</surname> <given-names>R</given-names>
</name>
<name>
<surname>Weber</surname> <given-names>T</given-names>
</name>
<name>
<surname>Moulinier</surname> <given-names>L</given-names>
</name>
<name>
<surname>Jeannin-Girardon</surname> <given-names>A</given-names>
</name>
<etal/>
</person-group>. <article-title>Spliceator: multi-species splice site prediction using convolutional neural networks</article-title>. <source>BMC Bioinf</source>. (<year>2021</year>) <volume>22</volume>:<fpage>561</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12859-021-04471-3</pub-id>
</citation>
</ref>
<ref id="B41">
<label>41</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Teufel</surname> <given-names>F</given-names>
</name>
<name>
<surname>Almagro Armenteros</surname> <given-names>JJ</given-names>
</name>
<name>
<surname>Johansen</surname> <given-names>AR</given-names>
</name>
<name>
<surname>G&#xed;slason</surname> <given-names>MH</given-names>
</name>
<name>
<surname>Pihl</surname> <given-names>SI</given-names>
</name>
<name>
<surname>Tsirigos</surname> <given-names>KD</given-names>
</name>
<etal/>
</person-group>. <article-title>SignalP 6.0 predicts all five types of signal peptides using protein language models</article-title>. <source>Nat Biotechnol</source>. (<year>2022</year>) <volume>40</volume>:<page-range>1023&#x2013;5</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41587-021-01156-3</pub-id>
</citation>
</ref>
<ref id="B42">
<label>42</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Langmead</surname> <given-names>B</given-names>
</name>
<name>
<surname>Salzberg</surname> <given-names>SL</given-names>
</name>
</person-group>. <article-title>Fast gapped-read alignment with Bowtie 2</article-title>. <source>Nat Methods</source>. (<year>2012</year>) <volume>9</volume>:<page-range>357&#x2013;9</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nmeth.1923</pub-id>
</citation>
</ref>
<ref id="B43">
<label>43</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Danecek</surname> <given-names>P</given-names>
</name>
<name>
<surname>Bonfield</surname> <given-names>JK</given-names>
</name>
<name>
<surname>Liddle</surname> <given-names>J</given-names>
</name>
<name>
<surname>Marshall</surname> <given-names>J</given-names>
</name>
<name>
<surname>Ohan</surname> <given-names>V</given-names>
</name>
<name>
<surname>Pollard</surname> <given-names>MO</given-names>
</name>
<etal/>
</person-group>. <article-title>Twelve years of SAMtools and BCFtools</article-title>. <source>GigaScience</source>. (<year>2021</year>) <volume>10</volume>:<elocation-id>giab008</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/gigascience/giab008</pub-id>
</citation>
</ref>
<ref id="B44">
<label>44</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Madeira</surname> <given-names>F</given-names>
</name>
<name>
<surname>Pearce</surname> <given-names>M</given-names>
</name>
<name>
<surname>Tivey</surname> <given-names>ARN</given-names>
</name>
<name>
<surname>Basutkar</surname> <given-names>P</given-names>
</name>
<name>
<surname>Lee</surname> <given-names>J</given-names>
</name>
<name>
<surname>Edbali</surname> <given-names>O</given-names>
</name>
<etal/>
</person-group>. <article-title>Search and sequence analysis tools services from EMBL-EBI in 2022</article-title>. <source>Nucleic Acids Res</source>. (<year>2022</year>) <volume>50</volume>:<page-range>W276&#x2013;9</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/gkac240</pub-id>
</citation>
</ref>
<ref id="B45">
<label>45</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Brown</surname> <given-names>NP</given-names>
</name>
<name>
<surname>Leroy</surname> <given-names>C</given-names>
</name>
<name>
<surname>Sander</surname> <given-names>C</given-names>
</name>
</person-group>. <article-title>MView: a web-compatible database search or multiple alignment viewer</article-title>. <source>Bioinformatics</source>. (<year>1998</year>) <volume>14</volume>:<page-range>380&#x2013;1</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/14.4.380</pub-id>
</citation>
</ref>
<ref id="B46">
<label>46</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ehrenmann</surname> <given-names>F</given-names>
</name>
<name>
<surname>Kaas</surname> <given-names>Q</given-names>
</name>
<name>
<surname>Lefranc</surname> <given-names>M-P</given-names>
</name>
</person-group>. <article-title>IMGT/3Dstructure-DB and IMGT/DomainGapAlign: a database and a tool for immunoglobulins or antibodies, T cell receptors, MHC, IgSF and MhcSF</article-title>. <source>Nucleic Acids Res</source>. (<year>2010</year>) <volume>38</volume>:<page-range>D301&#x2013;7</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/gkp946</pub-id>
</citation>
</ref>
<ref id="B47">
<label>47</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cock</surname> <given-names>PJA</given-names>
</name>
<name>
<surname>Antao</surname> <given-names>T</given-names>
</name>
<name>
<surname>Chang</surname> <given-names>JT</given-names>
</name>
<name>
<surname>Chapman</surname> <given-names>BA</given-names>
</name>
<name>
<surname>Cox</surname> <given-names>CJ</given-names>
</name>
<name>
<surname>Dalke</surname> <given-names>A</given-names>
</name>
<etal/>
</person-group>. <article-title>Biopython: freely available Python tools for computational molecular biology and bioinformatics</article-title>. <source>Bioinformatics</source>. (<year>2009</year>) <volume>25</volume>:<page-range>1422&#x2013;3</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/btp163</pub-id>
</citation>
</ref>
<ref id="B48">
<label>48</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hall</surname> <given-names>BG</given-names>
</name>
</person-group>. <article-title>Building phylogenetic trees from molecular data with MEGA</article-title>. <source>Mol Biol Evol</source>. (<year>2013</year>) <volume>30</volume>:<page-range>1229&#x2013;35</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/molbev/mst012</pub-id>
</citation>
</ref>
<ref id="B49">
<label>49</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tamura</surname> <given-names>K</given-names>
</name>
<name>
<surname>Stecher</surname> <given-names>G</given-names>
</name>
<name>
<surname>Kumar</surname> <given-names>S</given-names>
</name>
</person-group>. <article-title>MEGA11: molecular evolutionary genetics analysis version 11</article-title>. <source>Mol Biol Evol</source>. (<year>2021</year>) <volume>38</volume>:<page-range>3022&#x2013;7</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/molbev/msab120</pub-id>
</citation>
</ref>
<ref id="B50">
<label>50</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Letunic</surname> <given-names>I</given-names>
</name>
<name>
<surname>Bork</surname> <given-names>P</given-names>
</name>
</person-group>. <article-title>Interactive Tree Of Life (iTOL) v5: an online tool for phylogenetic tree display and annotation</article-title>. <source>Nucleic Acids Res</source>. (<year>2021</year>) <volume>49</volume>:<page-range>W293&#x2013;6</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/gkab301</pub-id>
</citation>
</ref>
<ref id="B51">
<label>51</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Okonechnikov</surname> <given-names>K</given-names>
</name>
<name>
<surname>Golosova</surname> <given-names>O</given-names>
</name>
<name>
<surname>Fursov</surname> <given-names>M</given-names>
</name>
<collab>The UGENE Team</collab>
</person-group>. <article-title>Unipro UGENE: a unified bioinformatics toolkit</article-title>. <source>Bioinformatics</source>. (<year>2012</year>) <volume>28</volume>:<page-range>1166&#x2013;7</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/bts091</pub-id>
</citation>
</ref>
<ref id="B52">
<label>52</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zulkower</surname> <given-names>V</given-names>
</name>
<name>
<surname>Rosser</surname> <given-names>S</given-names>
</name>
</person-group>. <article-title>DNA Features Viewer: a sequence annotation formatting and plotting library for Python</article-title>. <source>Bioinformatics</source>. (<year>2020</year>) <volume>36</volume>:<page-range>4350&#x2013;2</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/btaa213</pub-id>
</citation>
</ref>
<ref id="B53">
<label>53</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Turchaninova</surname> <given-names>MA</given-names>
</name>
<name>
<surname>Davydov</surname> <given-names>A</given-names>
</name>
<name>
<surname>Britanova</surname> <given-names>OV</given-names>
</name>
<name>
<surname>Shugay</surname> <given-names>M</given-names>
</name>
<name>
<surname>Bikos</surname> <given-names>V</given-names>
</name>
<name>
<surname>Egorov</surname> <given-names>ES</given-names>
</name>
<etal/>
</person-group>. <article-title>High-quality full-length immunoglobulin profiling with unique molecular barcoding</article-title>. <source>Nat Protoc</source>. (<year>2016</year>) <volume>11</volume>:<page-range>1599&#x2013;616</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nprot.2016.093</pub-id>
</citation>
</ref>
<ref id="B54">
<label>54</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Migalska</surname> <given-names>M</given-names>
</name>
<name>
<surname>Sebastian</surname> <given-names>A</given-names>
</name>
<name>
<surname>Radwan</surname> <given-names>J</given-names>
</name>
</person-group>. <article-title>Profiling of the TCR&#x3b2; repertoire in non-model species using high-throughput sequencing</article-title>. <source>Sci Rep</source>. (<year>2018</year>) <volume>8</volume>:<fpage>11613</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41598-018-30037-0</pub-id>
</citation>
</ref>
<ref id="B55">
<label>55</label>
<citation citation-type="web">
<person-group person-group-type="author">
<name>
<surname>Andrews</surname> <given-names>S</given-names>
</name>
</person-group>. <article-title>FastQC: a quality control tool for high throughput sequence data</article-title>. (<year>2010</year>). Available online at: <uri xlink:href="https://www.bioinformatics.babraham.ac.uk/projects/fastqc/">https://www.bioinformatics.babraham.ac.uk/projects/fastqc/</uri>.</citation>
</ref>
<ref id="B56">
<label>56</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ewels</surname> <given-names>P</given-names>
</name>
<name>
<surname>Magnusson</surname> <given-names>M</given-names>
</name>
<name>
<surname>Lundin</surname> <given-names>S</given-names>
</name>
<name>
<surname>K&#xe4;ller</surname> <given-names>M</given-names>
</name>
</person-group>. <article-title>MultiQC: summarize analysis results for multiple tools and samples in a single report</article-title>. <source>Bioinformatics</source>. (<year>2016</year>) <volume>32</volume>:<page-range>3047&#x2013;8</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/btw354</pub-id>
</citation>
</ref>
<ref id="B57">
<label>57</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bolotin</surname> <given-names>DA</given-names>
</name>
<name>
<surname>Poslavsky</surname> <given-names>S</given-names>
</name>
<name>
<surname>Mitrophanov</surname> <given-names>I</given-names>
</name>
<name>
<surname>Shugay</surname> <given-names>M</given-names>
</name>
<name>
<surname>Mamedov</surname> <given-names>IZ</given-names>
</name>
<name>
<surname>Putintseva</surname> <given-names>EV</given-names>
</name>
<etal/>
</person-group>. <article-title>MiXCR: software for comprehensive adaptive immunity profiling</article-title>. <source>Nat Methods</source>. (<year>2015</year>) <volume>12</volume>:<page-range>380&#x2013;1</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nmeth.3364</pub-id>
</citation>
</ref>
<ref id="B58">
<label>58</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hunter</surname> <given-names>JD</given-names>
</name>
</person-group>. <article-title>Matplotlib: A 2D graphics environment</article-title>. <source>Computing Sci Eng</source>. (<year>2007</year>) <volume>9</volume>:<page-range>90&#x2013;5</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1109/MCSE.2007.55</pub-id>
</citation>
</ref>
<ref id="B59">
<label>59</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Harris</surname> <given-names>CR</given-names>
</name>
<name>
<surname>Millman</surname> <given-names>KJ</given-names>
</name>
<name>
<surname>van der Walt</surname> <given-names>SJ</given-names>
</name>
<name>
<surname>Gommers</surname> <given-names>R</given-names>
</name>
<name>
<surname>Virtanen</surname> <given-names>P</given-names>
</name>
<name>
<surname>Cournapeau</surname> <given-names>D</given-names>
</name>
<etal/>
</person-group>. <article-title>Array programming with NumPy</article-title>. <source>Nature</source>. (<year>2020</year>) <volume>585</volume>:<page-range>357&#x2013;62</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41586-020-2649-2</pub-id>
</citation>
</ref>
<ref id="B60">
<label>60</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Virtanen</surname> <given-names>P</given-names>
</name>
<name>
<surname>Gommers</surname> <given-names>R</given-names>
</name>
<name>
<surname>Oliphant</surname> <given-names>TE</given-names>
</name>
<name>
<surname>Haberland</surname> <given-names>M</given-names>
</name>
<name>
<surname>Reddy</surname> <given-names>T</given-names>
</name>
<name>
<surname>Cournapeau</surname> <given-names>D</given-names>
</name>
<etal/>
</person-group>. <article-title>SciPy 1.0: fundamental algorithms for scientific computing in Python</article-title>. <source>Nat Methods</source>. (<year>2020</year>) <volume>17</volume>:<page-range>261&#x2013;72</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41592-019-0686-2</pub-id>
</citation>
</ref>
<ref id="B61">
<label>61</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Waskom</surname> <given-names>M</given-names>
</name>
</person-group>. <article-title>seaborn: statistical data visualization</article-title>. <source>J Open Source Software</source>. (<year>2021</year>) <volume>6</volume>:<elocation-id>3021</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.21105/joss.03021</pub-id>
</citation>
</ref>
<ref id="B62">
<label>62</label>
<citation citation-type="book">
<person-group person-group-type="author">
<collab>The pandas development team</collab>
</person-group>. <source>pandas-dev/pandas: Pandas (v1.5.2)</source>. <publisher-name>Zenodo</publisher-name> (<year>2022</year>). doi:&#xa0;<pub-id pub-id-type="doi">10.5281/zenodo.7344967</pub-id>
</citation>
</ref>
<ref id="B63">
<label>63</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wickham</surname> <given-names>H</given-names>
</name>
</person-group>. <article-title>Reshaping data with the reshape package</article-title>. <source>J Stat Software</source>. (<year>2007</year>) <volume>21</volume>:<fpage>1</fpage>&#x2013;<lpage>20</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.18637/jss.v021.i12</pub-id>
</citation>
</ref>
<ref id="B64">
<label>64</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wickham</surname> <given-names>H</given-names>
</name>
<name>
<surname>Averick</surname> <given-names>M</given-names>
</name>
<name>
<surname>Bryan</surname> <given-names>J</given-names>
</name>
<name>
<surname>Chang</surname> <given-names>W</given-names>
</name>
<name>
<surname>McGowan</surname> <given-names>LD</given-names>
</name>
<name>
<surname>Fran&#xe7;ois</surname> <given-names>R</given-names>
</name>
<etal/>
</person-group>. <article-title>Welcome to the tidyverse</article-title>. <source>J Open Source Software</source>. (<year>2019</year>) <volume>4</volume>:<elocation-id>1686</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.21105/joss.01686</pub-id>
</citation>
</ref>
<ref id="B65">
<label>65</label>
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Venables</surname> <given-names>WN</given-names>
</name>
<name>
<surname>Ripley</surname> <given-names>BD</given-names>
</name>
</person-group>. <source><italic>Modern Applied Statistics with S</italic></source>. <edition>4th ed</edition>. <publisher-loc>New York</publisher-loc>: <publisher-name>Springer</publisher-name> (<year>2002</year>). Available online at: <uri xlink:href="https://www.stats.ox.ac.uk/pub/MASS4/">https://www.stats.ox.ac.uk/pub/MASS4/</uri>.</citation>
</ref>
<ref id="B66">
<label>66</label>
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Fox</surname> <given-names>J</given-names>
</name>
<name>
<surname>Weisberg</surname> <given-names>S</given-names>
</name>
</person-group>. <source>An R Companion to Applied Regression</source>. <edition>3rd ed</edition>. <publisher-loc>Thousand Oaks, CA</publisher-loc>: <publisher-name>Sage</publisher-name> (<year>2019</year>). Available online at: <uri xlink:href="https://socialsciences.mcmaster.ca/jfox/Books/Companion/">https://socialsciences.mcmaster.ca/jfox/Books/Companion/</uri>.</citation>
</ref>
<ref id="B67">
<label>67</label>
<citation citation-type="web">
<person-group person-group-type="author">
<name>
<surname>Lenth</surname> <given-names>RV</given-names>
</name>
<name>
<surname>Bolker</surname> <given-names>B</given-names>
</name>
<name>
<surname>Buerkner</surname> <given-names>P</given-names>
</name>
<name>
<surname>Gin&#xe9;-V&#xe1;zquez</surname> <given-names>I</given-names>
</name>
<name>
<surname>Herve</surname> <given-names>M</given-names>
</name>
<name>
<surname>Jung</surname> <given-names>M</given-names>
</name>
<etal/>
</person-group>. <article-title>emmeans: Estimated Marginal Means, aka Least-Squares Means</article-title>. (<year>2024</year>). Available online at: <uri xlink:href="https://cran.r-project.org/web/packages/emmeans/index.html">https://cran.r-project.org/web/packages/emmeans/index.html</uri> (Accessed <access-date>9 February 2024</access-date>).</citation>
</ref>
<ref id="B68">
<label>68</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cowell</surname> <given-names>LG</given-names>
</name>
<name>
<surname>Davila</surname> <given-names>M</given-names>
</name>
<name>
<surname>Kepler</surname> <given-names>TB</given-names>
</name>
<name>
<surname>Kelsoe</surname> <given-names>G</given-names>
</name>
</person-group>. <article-title>Identification and utilization of arbitrary correlations in models of recombination signal sequences</article-title>. <source>Genome Biol</source>. (<year>2002</year>) <volume>3</volume>:<fpage>research0072.1</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/gb-2002-3-12-research0072</pub-id>
</citation>
</ref>
<ref id="B69">
<label>69</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Glusman</surname> <given-names>G</given-names>
</name>
<name>
<surname>Rowen</surname> <given-names>L</given-names>
</name>
<name>
<surname>Lee</surname> <given-names>I</given-names>
</name>
<name>
<surname>Boysen</surname> <given-names>C</given-names>
</name>
<name>
<surname>Roach</surname> <given-names>JC</given-names>
</name>
<name>
<surname>Smit</surname> <given-names>AFA</given-names>
</name>
<etal/>
</person-group>. <article-title>Comparative genomics of the human and mouse T cell receptor loci</article-title>. <source>Immunity</source>. (<year>2001</year>) <volume>15</volume>:<page-range>337&#x2013;49</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/S1074-7613(01)00200-X</pub-id>
</citation>
</ref>
<ref id="B70">
<label>70</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pannetier</surname> <given-names>C</given-names>
</name>
<name>
<surname>Cochet</surname> <given-names>M</given-names>
</name>
<name>
<surname>Darche</surname> <given-names>S</given-names>
</name>
<name>
<surname>Casrouge</surname> <given-names>A</given-names>
</name>
<name>
<surname>Z&#xf6;ller</surname> <given-names>M</given-names>
</name>
<name>
<surname>Kourilsky</surname> <given-names>P</given-names>
</name>
</person-group>. <article-title>The sizes of the CDR3 hypervariable regions of the murine T-cell receptor beta chains vary as a function of the recombined germ-line segments</article-title>. <source>Proc Natl Acad Sci USA</source>. (<year>1993</year>) <volume>90</volume>:<page-range>4319&#x2013;23</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.90.9.4319</pub-id>
</citation>
</ref>
<ref id="B71">
<label>71</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cibotti</surname> <given-names>R</given-names>
</name>
<name>
<surname>Cabaniols</surname> <given-names>JP</given-names>
</name>
<name>
<surname>Pannetier</surname> <given-names>C</given-names>
</name>
<name>
<surname>Delarbre</surname> <given-names>C</given-names>
</name>
<name>
<surname>Vergnon</surname> <given-names>I</given-names>
</name>
<name>
<surname>Kanellopoulos</surname> <given-names>JM</given-names>
</name>
<etal/>
</person-group>. <article-title>Public and private V beta T cell receptor repertoires against hen egg white lysozyme (HEL) in nontransgenic versus HEL transgenic mice</article-title>. <source>J Exp Med</source>. (<year>1994</year>) <volume>180</volume>:<page-range>861&#x2013;72</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1084/jem.180.3.861</pub-id>
</citation>
</ref>
<ref id="B72">
<label>72</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pan</surname> <given-names>M</given-names>
</name>
<name>
<surname>Li</surname> <given-names>B</given-names>
</name>
</person-group>. <article-title>T cell receptor convergence is an indicator of antigen-specific T cell response in cancer immunotherapies</article-title>. <source>eLife</source>. (<year>2022</year>) <volume>11</volume>:<elocation-id>e81952</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.7554/eLife.81952</pub-id>
</citation>
</ref>
<ref id="B73">
<label>73</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Woodsworth</surname> <given-names>DJ</given-names>
</name>
<name>
<surname>Castellarin</surname> <given-names>M</given-names>
</name>
<name>
<surname>Holt</surname> <given-names>RA</given-names>
</name>
</person-group>. <article-title>Sequence analysis of T-cell repertoires in health and disease</article-title>. <source>Genome Med</source>. (<year>2013</year>) <volume>5</volume>:<fpage>98</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/gm502</pub-id>
</citation>
</ref>
<ref id="B74">
<label>74</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lefranc</surname> <given-names>M-P</given-names>
</name>
</person-group>. <article-title>IMGT, the international ImMunoGeneTics information system</article-title>. <source>Cold Spring Harbor Protoc</source>. (<year>2011</year>) <volume>2011</volume>:<fpage>595</fpage>&#x2013;<lpage>603</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1101/pdb.top115</pub-id>
</citation>
</ref>
<ref id="B75">
<label>75</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mian</surname> <given-names>IS</given-names>
</name>
<name>
<surname>Bradwell</surname> <given-names>AR</given-names>
</name>
<name>
<surname>Olson</surname> <given-names>AJ</given-names>
</name>
</person-group>. <article-title>Structure, function and properties of antibody binding sites</article-title>. <source>J Mol Biol</source>. (<year>1991</year>) <volume>217</volume>:<page-range>133&#x2013;51</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/0022-2836(91)90617-F</pub-id>
</citation>
</ref>
<ref id="B76">
<label>76</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Prochnicka-Chalufour</surname> <given-names>A</given-names>
</name>
<name>
<surname>Casanova</surname> <given-names>J-L</given-names>
</name>
<name>
<surname>Avrameas</surname> <given-names>S</given-names>
</name>
<name>
<surname>Claverie</surname> <given-names>J-M</given-names>
</name>
<name>
<surname>Kourilsky</surname> <given-names>P</given-names>
</name>
</person-group>. <article-title>Biased amino acid distributions in regions of the T cell receptors and MHC molecules potentially involved in their association</article-title>. <source>Int Immunol</source>. (<year>1991</year>) <volume>3</volume>:<page-range>853&#x2013;64</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/intimm/3.9.853</pub-id>
</citation>
</ref>
<ref id="B77">
<label>77</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zemlin</surname> <given-names>M</given-names>
</name>
<name>
<surname>Klinger</surname> <given-names>M</given-names>
</name>
<name>
<surname>Link</surname> <given-names>J</given-names>
</name>
<name>
<surname>Zemlin</surname> <given-names>C</given-names>
</name>
<name>
<surname>Bauer</surname> <given-names>K</given-names>
</name>
<name>
<surname>Engler</surname> <given-names>JA</given-names>
</name>
<etal/>
</person-group>. <article-title>Expressed murine and human CDR-H3 intervals of equal length exhibit distinct repertoires that differ in their amino acid composition and predicted range of structures</article-title>. <source>J Mol Biol</source>. (<year>2003</year>) <volume>334</volume>:<page-range>733&#x2013;49</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.jmb.2003.10.007</pub-id>
</citation>
</ref>
<ref id="B78">
<label>78</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Koide</surname> <given-names>S</given-names>
</name>
<name>
<surname>Sidhu</surname> <given-names>SS</given-names>
</name>
</person-group>. <article-title>The importance of being tyrosine: lessons in molecular recognition from minimalist synthetic binding proteins</article-title>. <source>ACS Chem Biol</source>. (<year>2009</year>) <volume>4</volume>:<page-range>325&#x2013;34</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1021/cb800314v</pub-id>
</citation>
</ref>
<ref id="B79">
<label>79</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hung</surname> <given-names>S-J</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>Y-L</given-names>
</name>
<name>
<surname>Chu</surname> <given-names>C-H</given-names>
</name>
<name>
<surname>Lee</surname> <given-names>C-C</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>W-L</given-names>
</name>
<name>
<surname>Lin</surname> <given-names>Y-L</given-names>
</name>
<etal/>
</person-group>. <article-title>TRIg: a robust alignment pipeline for non-regular T-cell receptor and immunoglobulin sequences</article-title>. <source>BMC Bioinf</source>. (<year>2016</year>) <volume>17</volume>:<fpage>433</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12859-016-1304-2</pub-id>
</citation>
</ref>
<ref id="B80">
<label>80</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shugay</surname> <given-names>M</given-names>
</name>
<name>
<surname>Britanova</surname> <given-names>OV</given-names>
</name>
<name>
<surname>Merzlyak</surname> <given-names>EM</given-names>
</name>
<name>
<surname>Turchaninova</surname> <given-names>MA</given-names>
</name>
<name>
<surname>Mamedov</surname> <given-names>IZ</given-names>
</name>
<name>
<surname>Tuganbaev</surname> <given-names>TR</given-names>
</name>
<etal/>
</person-group>. <article-title>Towards error-free profiling of immune repertoires</article-title>. <source>Nat Methods</source>. (<year>2014</year>) <volume>11</volume>:<page-range>653&#x2013;5</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nmeth.2960</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>