<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3-mathml3.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:ali="http://www.niso.org/schemas/ali/1.0/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="1.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Immunol.</journal-id>
<journal-title-group>
<journal-title>Frontiers in Immunology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Immunol.</abbrev-journal-title>
</journal-title-group>
<issn pub-type="epub">1664-3224</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fimmu.2026.1749369</article-id>
<article-version article-version-type="Version of Record" vocab="NISO-RP-8-2008"/>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Original Research</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>Ensemble molecular mimicry correlates with antibody cross-reactivity in proteome-wide studies</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name><surname>Wrabl</surname><given-names>James O.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/3332886/overview"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="visualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/visualization/">Visualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Beale</surname><given-names>Josh</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Fortunato</surname><given-names>Gabriel</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Monsalve</surname><given-names>Antonieta van den Berg</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="author-notes" rid="fn003"><sup>&#x2020;</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Hilser</surname><given-names>Vincent J.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>*</sup></xref>
<xref ref-type="author-notes" rid="fn004"><sup>&#x2021;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/3284048/overview"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Funding acquisition" vocab-term-identifier="https://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Project-administration" vocab-term-identifier="https://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
</contrib-group>
<aff id="aff1"><label>1</label><institution>Department of Biology, Johns Hopkins University</institution>, <city>Baltimore MD</city>,&#xa0;<country country="us">United States</country></aff>
<aff id="aff2"><label>2</label><institution>Cell, Molecular, Developmental Biology, and Biophysics Graduate Program, Johns Hopkins University</institution>, <city>Baltimore MD</city>,&#xa0;<country country="us">United States</country></aff>
<aff id="aff3"><label>3</label><institution>T. C. Jenkins Department of Biophysics, Johns Hopkins University</institution>, <city>Baltimore MD</city>,&#xa0;<country country="us">United States</country></aff>
<aff id="aff4"><label>4</label><institution>Program in Molecular Biophysics Graduate Program, Johns Hopkins University</institution>, <city>Baltimore MD</city>,&#xa0;<country country="us">United States</country></aff>
<author-notes>
<corresp id="c001"><label>*</label>Correspondence: Vincent J. Hilser, <email xlink:href="mailto:Hilser@jhu.edu">Hilser@jhu.edu</email></corresp>
<fn fn-type="present-address" id="fn003">
<label>&#x2020;</label>
<p>Present address: Antonieta van den Berg Monsalve, Department of Biology, Otterbein University, Westerville OH, United States</p></fn>
<fn fn-type="other" id="fn004">
<label>&#x2021;</label>
<p>ORCID: Vincent J. Hilser, <uri xlink:href="https://orcid.org/0000-0002-7173-0073">orcid.org/0000-0002-7173-0073</uri></p></fn>
</author-notes>
<pub-date publication-format="electronic" date-type="pub" iso-8601-date="2026-02-10">
<day>10</day>
<month>02</month>
<year>2026</year>
</pub-date>
<pub-date publication-format="electronic" date-type="collection">
<year>2026</year>
</pub-date>
<volume>17</volume>
<elocation-id>1749369</elocation-id>
<history>
<date date-type="received">
<day>18</day>
<month>11</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>15</day>
<month>01</month>
<year>2026</year>
</date>
<date date-type="rev-recd">
<day>14</day>
<month>01</month>
<year>2026</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2026 Wrabl, Beale, Fortunato, Monsalve and Hilser.</copyright-statement>
<copyright-year>2026</copyright-year>
<copyright-holder>Wrabl, Beale, Fortunato, Monsalve and Hilser</copyright-holder>
<license>
<ali:license_ref start_date="2026-02-10">https://creativecommons.org/licenses/by/4.0/</ali:license_ref>
<license-p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</license-p>
</license>
</permissions>
<abstract>
<p>Energetics of protein&#x2013;protein binding necessarily include contributions both from conformational equilibria and from interfacial interactions. In the particular case of an antibody binding to a protein epitope, the conformational contribution is typically neglected as the antibody-bound and free forms of the protein are usually highly similar, leading to the reasonable conclusion that binding affinity in most cases can be reconciled in the context of observed interfacial interactions. However, the phenomenon of molecular mimicry has also been widely observed, wherein antibodies raised against one sequence/structure are able to recognize a completely different sequence/structure. This observation suggests that, in some cases, the conformational contribution could play a significant role in facilitating this cross-reactivity. Here, this conjecture is supported, utilizing a recent discovery that permits evaluation of the thermodynamic compatibility of any sequence for the conformational ensemble of any other protein&#x2014;in effect providing direct access to the conformational contribution to binding. The importance of the contribution could then be assessed on a proteome-wide scale, in the context of the unexpected cross-reactivity observed when the human proteome is challenged with antibodies raised against a set of virus protein antigens. Because the virus protein antigens and the cross-reactive human proteins share substantial similarity when modeled as thermodynamic ensembles, despite the absence of detectable sequence or structural similarity, we hypothesize that these cross-reactive epitopes share a novel kind of immunological molecular mimicry, termed &#x201c;ensemble molecular mimicry&#x201d; (EMM). To investigate potential mechanisms, a sequence-based algorithm was developed to probe for the relationship between high scoring sequence segments and cross-reacting epitopes, and it was discovered that 9 of 11 medically relevant cross-reactive epitopes taken from the literature exhibited higher-than-expected local EMM values. Taken together, the results suggest that conformational equilibrium can affect affinity and that it is hypothetically possible for cross-reactive epitopes to share a pairwise thermodynamic signature, even in the absence of sequence or structural similarity.</p>
</abstract>
<kwd-group>
<kwd>autoimmunity</kwd>
<kwd>binding energetics</kwd>
<kwd>conformational equilibrium</kwd>
<kwd>polyclonal</kwd>
<kwd>protein ensemble</kwd>
</kwd-group>
<funding-group>
<funding-statement>The author(s) declared that financial support was received for this work and/or its publication. Funding was provided by NIH: R01-GM63747 and R01-GM121567. JB was supported by NIH T32-GM007231 training grant and GF was supported by NIH T32-GM008403 training grant.</funding-statement>
</funding-group>
<counts>
<fig-count count="7"/>
<table-count count="0"/>
<equation-count count="0"/>
<ref-count count="47"/>
<page-count count="14"/>
<word-count count="8766"/>
</counts>
<custom-meta-group>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Viral Immunology</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<label>1</label>
<title>Introduction</title>
<p>Thousands of high-resolution structures of antibody&#x2013;antigen complexes exist in the Protein Data Bank (<xref ref-type="bibr" rid="B1">1</xref>, <xref ref-type="bibr" rid="B2">2</xref>). This wealth of data has been transformative for the understanding of antibody specificity and computation of the intermolecular energetics underlying affinity. However, routine estimation of accurate binding energies from structure remains elusive and often requires resource-intensive simulations. As such, significant efforts have been directed towards force-field development and artificial intelligence-driven molecular modeling (<xref ref-type="bibr" rid="B3">3</xref>&#x2013;<xref ref-type="bibr" rid="B7">7</xref>), but despite these efforts, reliable prediction of which antibodies will bind to which antigens, and how tightly, is not currently achievable (<xref ref-type="bibr" rid="B8">8</xref>).</p>
<p>While the binding energetics at the antibody&#x2013;antigen interface are undoubtedly important and most accessible for study, less attention has been paid to the idea that every protein&#x2013;protein binding reaction also includes a contribution from the ensemble conformational equilibrium. There is always a separate energy cost for the antigen (as well as the antibody) to adopt the specific conformations necessary to form the complex, i.e., a free energy of stability upon which the population of binding-competent antigen, as dictated by statistical thermodynamics, depends. In the case of high-affinity, monoclonal antibody complexes, this contribution might be safely ignored, as strong interfacial atomic interactions would be expected to dominate overall binding affinity. For weaker polyclonal responses, however, ensemble conformational equilibrium can be the decisive factor, as demonstrated by the elegant pioneering experiments of Anfinsen and colleagues (<xref ref-type="bibr" rid="B9">9</xref>, <xref ref-type="bibr" rid="B10">10</xref>).</p>
<p>If ensemble conformational equilibrium is relevant to the polyclonal response to antigen, how can it be detected? In this work, we take a biophysical approach to the question by deploying state-of-the-art proteome chip technology, which enables large-scale measurements of relative binding affinities for a panel of polyclonal antibodies against nearly the entire human proteome (<italic>N</italic> ~ 20,000 proteins). These relative affinities are then compared to high-throughput computational estimates of ensemble conformational equilibrium developed in this laboratory, which are calculated in pairwise fashion between highest-affinity proteins from the chip and the antigens against which the polyclonal antibodies were raised.</p>
<p>In these experiments we test the null hypothesis that affinity and conformational equilibrium are unrelated, and based on modest but significant correlation between empirical affinities and computations, we conclude that ensemble conformational equilibrium should not be neglected as part of the polyclonal response. Furthermore, because the antigens are derived from a virus and the binding proteins come from the human proteome, the results report unexpected cross-reactivity and may help to explain documented cases of molecular mimicry in varied auto-immune diseases characterized by cross-reactive epitopes that do not exhibit obvious sequence or structure similarity (<xref ref-type="bibr" rid="B11">11</xref>&#x2013;<xref ref-type="bibr" rid="B14">14</xref>). Instead, we hypothesize a new type of epitope based on &#x201c;ensemble molecular mimicry&#x201d; (EMM), which could be revealed through detailed thermodynamic analysis of local conformational equilibria between pairs of proteins. This ensemble information may be useful for the future prediction of auto-antigenic proteins and epitopes.</p>
</sec>
<sec id="s2" sec-type="results">
<label>2</label>
<title>Results</title>
<sec id="s2_1">
<label>2.1</label>
<title>Fluorescence as a proxy for total binding free energy</title>
<p>We consider any macromolecular binding reaction, such as that between an antibody (Ab) and a specific antigen, as a series of two coupled equilibria (<xref ref-type="fig" rid="f1"><bold>Figure&#xa0;1A</bold></xref>) (<xref ref-type="bibr" rid="B9">9</xref>). In this scheme, binding free energy (&#x394;<italic>G</italic><sub>total</sub>) is influenced by at least two energetic contributions: An <italic>intrinsic</italic> contribution (&#x394;<italic>G</italic><sub>int</sub>) resulting from the interactions of particular chemical groups between the antibody and the antigen (such as hydrogen bonding, charge&#x2013;charge interactions, and hydrophobic packing), and a conformational contribution (&#x394;<italic>G</italic><sub>conf</sub>) reflecting the free energy required for the epitope to adopt a binding-competent geometry. We expect that the particular sequence of the amino acids at the binding interface is primarily accounted for by the &#x394;<italic>G</italic><sub>int</sub> term, whereas contributions associated with redistributing the conformational ensemble to those conformations capable of binding the antibody, e.g., protein folding, comprise the &#x394;<italic>G</italic><sub>conf</sub> term.</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>Conformational equilibrium contributes to binding affinity and affinity can be measured by proteome-on-a-chip technology. <bold>(A)</bold> Conformational equilibrium contributes to binding affinity. In general, coupled equilibria exist describing the binding between an antibody (black cartoon Y) and an antigen (colored beads-on-string cartoon). The free energy of binding (&#x394;<italic>G</italic><sub>total</sub>) has two major contributions: a free energy of the antigen epitope interacting with the antibody paratope (&#x394;<italic>G</italic><sub>int</sub>), and a free energy of the antigen epitope adopting the correct conformation to permit interaction (&#x394;<italic>G</italic><sub>conf</sub>). For binding to occur (orange box, right side), the antigen must adopt a binding-competent conformation (purple box, right side) as opposed to a binding-incompetent conformation (purple box, left side). Conformational equilibrium of the epitope between binding-incompetent and binding-competent shapes is suggested by the purple box. The hypothesis tested in this work is that while epitope sequence conservation is reflected by &#x394;<italic>G</italic><sub>int</sub>, thermodynamic molecular mimicry in the absence of sequence identity can be facilitated by a favorable &#x394;<italic>G</italic><sub>conf</sub>. <bold>(B)</bold> Affinity can be measured by proteome-on-a-chip technology. Almost the entire human proteome can be expressed, purified, and spotted on a nitrocellulose/glass chip (left side) using technology developed by CDI Laboratories, Inc. (Baltimore, MD). Each yellow spot represents many copies of a localized particular human protein. An antibody or serum sample (black cartoon Y) can be passed over the chip, probing all of the proteome simultaneously with a primary antibody. Binding of primary antibody to localized proteins on the chip can be quantified with a fluorescent secondary antibody (not shown), akin to a Western blot. Schematized locations of binding are shown by dots with shades of gray. It is assumed that degree of fluorescence is proportional to relative affinity.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fimmu-17-1749369-g001.tif">
<alt-text content-type="machine-generated">A two-part illustration. Panel A shows the equation &#x394;G_total = &#x394;G_conf + &#x394;G_int, depicting conformational redistribution and antibody-epitope interaction processes. Structures and antibodies are shown with arrows indicating reversible reactions. Panel B illustrates the experimental setup: a chip with human proteome (~20,000 proteins) interacts with a polyclonal antibody, leading to measured cross-reactivity proportional to &#x394;G_total, represented by highlighted spots on the chip.</alt-text>
</graphic></fig>
<p>The classic view of antibody binding is one of rigid-body association, which assumes that the &#x394;<italic>G</italic><sub>conf</sub> term is relatively small and that tight binding originates from high structural compatibility between the Fab region of the antibody and the antigen that it binds. Indeed, high similarity is often observed when the structures of unbound and antibody-bound antigens are compared, supporting the notion that the conformational free energy difference between unbound and bound states is small, at least in those cases (&#x394;<italic>G</italic><sub>conf</sub> ~ 0) (<xref ref-type="bibr" rid="B15">15</xref>, <xref ref-type="bibr" rid="B16">16</xref>). However, it is also well known that the antibody maturation process involves an initial polyclonal response, which consists of numerous sequence-distinct antibodies whose individual binding affinities are significantly lower than the mature (monoclonal) antibody, but whose collective binding affinity is relatively high. Moreover, the two contributors to overall binding energy may compensate for each other. For example, if an antigen readily populates a large sub-ensemble of conformational states, each of which can only provide sub-optimal contacts at the binding interface(s), then this &#x201c;penalty&#x201d; of a relatively high &#x394;<italic>G</italic><sub>int</sub> can be countered by a relatively low &#x394;<italic>G</italic><sub>conf</sub> (<xref ref-type="fig" rid="f1"><bold>Figure&#xa0;1A</bold></xref>). In other words, the bound complex can be conformationally heterogeneous, as schematically depicted in <xref ref-type="fig" rid="f1"><bold>Figure&#xa0;1A</bold></xref>.</p>
<p>Although the gold-standard measurement of binding affinity (&#x394;<italic>G</italic><sub>total</sub>) requires bulk-solution biophysical methods that monitor direct binding, such as isothermal titration calorimetry, fluorescence anisotropy, or nuclear magnetic resonance, these low-throughput methods are not amenable to proteome-scale measurements of antibody&#x2013;target complexes. To estimate &#x394;<italic>G</italic><sub>total</sub> on a large scale, we instead measure the secondary fluorescence signal generated when a primary antibody binds to a target protein localized on a nitrocellulose/glass chip, as implemented on <italic>HuProt</italic> chips by CDI Labs, Inc. (<xref ref-type="fig" rid="f1"><bold>Figure&#xa0;1B</bold></xref>, Section 4.1). One <italic>HuProt</italic> chip can localize large numbers of folded proteins, including essentially the entire human proteome (<xref ref-type="fig" rid="f1"><bold>Figure&#xa0;1B</bold></xref>), and the relative binding of an antibody sample probing the entire proteome can be quantified.</p>
</sec>
<sec id="s2_2">
<label>2.2</label>
<title>Thermodynamic similarity (eTFR) as a proxy for free energy of conformational equilibrium</title>
<p>The conformational equilibrium shown in <xref ref-type="fig" rid="f1"><bold>Figure&#xa0;1A</bold></xref> is akin to a free energy of folding, which is notoriously difficult to measure by high-throughput methods [although progress is being made (<xref ref-type="bibr" rid="B17">17</xref>, <xref ref-type="bibr" rid="B18">18</xref>)]. For this work, we continue the development of a computational model of the energetics of the protein ensemble (<italic>COREX</italic>), which recently has been shown to measure the relative energetic distance (&#x394;<italic>G</italic><sub>conf</sub>) between two protein conformations (<xref ref-type="bibr" rid="B19">19</xref>&#x2013;<xref ref-type="bibr" rid="B21">21</xref>). In direct support of the current work, we demonstrated in those studies that protein sequences sharing no similarity can nonetheless adopt the same conformation, and that this propensity is predictable based on our characterization of ensembles from numerous proteins. Here, we go further and ask, if a sequence has a propensity to adopt an alternative fold, can that protein also be recognized by a ligand (or antibody) that binds that alternative fold? To address this question, we modified our previously presented methodology, as described briefly below.</p>
<p>Our approach is termed <italic>eScape</italic> Thermodynamic Fold Recognition (<italic>e</italic>TFR). <italic>e</italic>TFR merges two previously published computational resources. The <italic>eScape</italic> (<italic>e</italic>nergy land<italic>Scape</italic>) algorithm is a sequence-based predictor of the local folding stability (&#x394;<italic>G</italic>) of a protein, along with the enthalpic (apolar and polar &#x394;<italic>H</italic>) and entropic (<italic>T</italic>&#x394;<italic>S</italic> of apolar and polar solvation, as well as conformational <italic>T</italic>&#x394;<italic>S</italic>) components of that stability (<xref ref-type="bibr" rid="B22">22</xref>, <xref ref-type="bibr" rid="B23">23</xref>). This algorithm generates the energy landscape of the protein ensemble from information provided by <italic>thermodynamics</italic>, not amino acid sequence or structure (<xref ref-type="bibr" rid="B24">24</xref>&#x2013;<xref ref-type="bibr" rid="B26">26</xref>). Specifically, the energy landscape identifies which regions of the protein are more or less locally stable (i.e., more or less likely to be populated in a locally structured conformation).</p>
<p>Thermodynamic Fold Recognition uses &#x201c;thermodynamic environments&#x201d; (<xref ref-type="bibr" rid="B27">27</xref>&#x2013;<xref ref-type="bibr" rid="B29">29</xref>), defined by the clustering of a large database of vectors {&#x394;<italic>G</italic>, &#x394;<italic>H</italic>, <italic>T</italic>&#x394;<italic>S</italic>}, to create a protein&#x2019;s &#x201c;thermodynamic profile&#x201d; (<xref ref-type="bibr" rid="B30">30</xref>, <xref ref-type="bibr" rid="B31">31</xref>), which is used as a query to search a database of arbitrary amino acid sequences. Each pairwise alignment in the search is scored by dynamic programming subject to a thermodynamic substitution matrix, and the significance of each score is computed against a calibrated null model (<xref ref-type="bibr" rid="B19">19</xref>, <xref ref-type="bibr" rid="B32">32</xref>). In short, <italic>e</italic>TFR uses a thermodynamic profile derived from <italic>eScape</italic> as a query to search a sequence database with a <italic>thermodynamic</italic> substitution matrix instead of an <italic>amino acid</italic> substitution matrix. Importantly, this procedure essentially quantifies the compatibility of a protein thermodynamic ensemble with an amino acid sequence, providing a potentially powerful alternative to traditional sequence&#x2013;sequence, sequence&#x2013;structure, or structure&#x2013;structure algorithms, especially when the information output of the traditional methods is undetectably low.</p>
<p>Highest-significance <italic>e</italic>TFR matches are reliably obtained when the sequence of an extant protein is queried against its native thermodynamic profile, while next-highest matches often occur when <italic>homologous sequences</italic> are queried against the same profile (<xref ref-type="bibr" rid="B32">32</xref>). It has also been demonstrated that thermodynamic similarity can exist even below the &#x201c;twilight zone&#x201d; of sequence identity (<xref ref-type="bibr" rid="B31">31</xref>). It is thus likely that significant <italic>e</italic>TFR matches between two sequence-dissimilar proteins could predict a substantially favorable value of &#x394;<italic>G</italic><sub>conf</sub>, indicating that the conformational ensembles of the two proteins overlap to some degree and that each protein (or parts thereof) may transiently populate similar local conformations to the other. If true, then antibodies raised against one protein (e.g., protein A) may bind to a second protein (e.g., protein B). This could happen because, as shown previously (<xref ref-type="bibr" rid="B19">19</xref>&#x2013;<xref ref-type="bibr" rid="B21">21</xref>), high sequence compatibility corresponds to a low &#x394;<italic>G</italic><sub>conf</sub> for the sequence of protein B to adopt the structure of protein A. Importantly, these potential cross-reactivities could occur even in the absence of sequence or structural similarity.</p>
<p>We have demonstrated predictable antibody cross-reactivity on a small scale in at least three prospective cases of sequence-dissimilar pairs of proteins&#x2014;one a member of the SARS-CoV-2 proteome and the other identified from the human proteome&#x2014;which exhibit a high <italic>e</italic>TFR significance between them (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Figure S1A</bold></xref>) and bind to the same antibody on Western blot (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Figure S1B</bold></xref>). Of potential medical significance, these unexpected observations of cross-reactivity correspond to three of seven human proteins for which autoantibodies have been previously documented in the blood sera of acute COVID-19 patients (<xref ref-type="bibr" rid="B12">12</xref>, <xref ref-type="bibr" rid="B13">13</xref>). We hypothesize that <italic>e</italic>TFR can report on the likelihood that two proteins, even ostensibly unrelated ones, share conformational ensemble similarity. In as much as the computed similarity has been shown to allow one protein to even adopt the fold of the second protein (<xref ref-type="bibr" rid="B19">19</xref>), without explicit consideration of structural complementarity, we were motivated to determine if those same principles applied to the thermodynamic signatures of epitopes, thus motivating the current proteome-wide study.</p>
<p>The workflow for <italic>e</italic>TFR matching is shown in <xref ref-type="fig" rid="f2"><bold>Figure&#xa0;2</bold></xref>. Briefly, a thermodynamic profile of the virus antigen corresponding to a cognate polyclonal antibody (<xref ref-type="fig" rid="f2"><bold>Figure&#xa0;2</bold></xref>, Box 1, left) was computed with <italic>eScape</italic> from its amino acid sequence. As alluded to above, <italic>eScape</italic> is a machine-learning algorithm that in the simplest case generates a four-dimensional vector of thermodynamic descriptors {&#x394;<italic>G</italic>, &#x394;<italic>H</italic><sub>ap</sub>, &#x394;<italic>H</italic><sub>pol</sub>, <italic>T</italic>&#x394;<italic>S</italic><sub>conf</sub>} from each amino acid in a sequence, corresponding to the stability of the native (folded) state of the protein. Thermodynamic descriptors are mapped to thermodynamic environments (i.e., the closest cluster center of descriptors) observed in a large database of diverse proteins (<xref ref-type="fig" rid="f2"><bold>Figure&#xa0;2</bold></xref> and Box 2). This reduces the four-dimensional thermodynamic descriptor space to a one-dimensional thermodynamic profile (<xref ref-type="fig" rid="f2"><bold>Figure&#xa0;2</bold></xref> and Box 3, left, colored rectangles), for computational efficiency. Using standard dynamic programming, the thermodynamic profile can be optimally aligned to an arbitrary amino acid sequence (<xref ref-type="fig" rid="f2"><bold>Figure&#xa0;2</bold></xref> and Box 3, left) and a significance can then be computed (<xref ref-type="fig" rid="f2"><bold>Figure&#xa0;2</bold></xref> and Box 3, right). As mentioned above, in this work, the significance is considered a proxy for the &#x394;<italic>G</italic><sub>conf</sub> between the virus and human proteins used in the calculation (<xref ref-type="fig" rid="f2"><bold>Figure&#xa0;2</bold></xref>, bottom).</p>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>Workflow of &#x394;<italic>G</italic><sub>conf</sub> detection (ensemble molecular mimicry) using <italic>e</italic>TFR thermodynamic similarity. Two sequence-dissimilar epitopes (Box 1) exhibiting cross-reactivity to the same antibody (black cartoon Y) exist. The virus epitope (left) exhibits conformational equilibrium contributing to thermodynamic molecular mimicry with the human epitope, as depicted in <xref ref-type="fig" rid="f1"><bold>Figure&#xa0;1A</bold></xref>. Fluctuations are encoded by thermodynamic environments (TE, Box 2), as described in Section 5.3. Briefly, the sequence-based prediction software, <italic>eScape</italic>, locates each residue of the full-length protein within a TE space spanning the local free energy, enthalpy, entropy, amino acid size, and polarity observed in globular proteins. TEs are assigned as an eight-letter numerical &#x201c;alphabet&#x201d; (colored boxes) permitting standard methods of alignment score optimization to a human host protein, subject to a TE-amino acid substitution matrix; this process is termed <italic>eScape</italic> Thermodynamic fold recognition (<italic>e</italic>TFR). Calibration of optimal score against a parameterized null model results in a significance value (<italic>p</italic>-value), which is taken as an estimation of &#x394;<italic>G</italic><sub>conf</sub>, or thermodynamic molecular mimicry (Box 3). Thus, <italic>e</italic>TFR aligns two proteins with no explicit computation of amino acid sequence or structure similarity, instead using thermodynamic information, making it a suitable method for detection of low-sequence identity epitope similarities.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fimmu-17-1749369-g002.tif">
<alt-text content-type="machine-generated">Flowchart illustrating the process of comparing virus antigen sequences to cross-reactive human protein sequences. Step 1 involves asserting identical polyclonal antibodies for possibly dissimilar virus and human sequences. Step 2 assigns thermodynamic environments to the virus antigen with a colorful 3D plot showing stability and polarity. Step 3 computes thermodynamic similarity between virus and human proteins using a significance score based on sequence alignment and conformational changes.</alt-text>
</graphic></fig>
</sec>
<sec id="s2_3">
<label>2.3</label>
<title>Correlation between eTFR significance and chip fluorescence suggests association between &#x394;G<sub>conf</sub> and &#x394;G<sub>total</sub></title>
<p>A panel of seven commercial polyclonal primary antibodies, raised against seven SARS-CoV-2 full-length protein antigens, were passed over separate human proteome chips, under both native and denaturing conditions (Sections 4.1 and 4.2). These antibodies were chosen from a preliminary scan of the thermodynamic profiles of the SARS-CoV-2 proteome against the amino acid sequences of all proteins in the Protein Data Bank (<xref ref-type="bibr" rid="B2">2</xref>) (Section 4.4, <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Figure S1A</bold></xref>). For each human protein spot on the chip, secondary antibody fluorescence proportional to primary antibody affinity was reported as a <italic>Z</italic>-score relative to all proteins on the chip, and the sum of native and denatured <italic>Z</italic>-scores for each human protein was calculated (sums were taken because fluorescence signals were found to be relatively independent of native or denatured conditions, cf. <xref ref-type="fig" rid="f3"><bold>Figure&#xa0;3</bold></xref>).</p>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>Cross-reactive epitopes are likely to be unstructured and continuous. Each point in the plot represents the fluorescence signal of one anti-virus antibody binding to the same human protein, measured under native conditions (<italic>x</italic>-axis) or denatured (8 M urea) conditions (<italic>y</italic>-axis). The strong correlation suggests that structured epitopes were not a general feature of any of the human proteins studied. There is one exception, namely, human NMD3 protein binding anti-SARS-Cov-2 nsp13 polyclonal, which suggests a signal for structured epitope(s). Data for these figures, and the proteins involved, are listed in <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table S1</bold></xref>.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fimmu-17-1749369-g003.tif">
<alt-text content-type="machine-generated">Scatter plot showing the correlation between relative native and denatured antibody binding responses, both measured in Chip Z-Scores. The correlation coefficient (r) is +0.78, with a p-value less than 10^-6, indicating a strong positive relationship.</alt-text>
</graphic></fig>
<p>The 10 strongest-binding human proteins against each of the seven anti-virus antibodies of the panel were prioritized as part of CDI Labs&#x2019; analysis report, so that 7 &#xd7; 10 = 70 protein pairs of virus antigen and human protein were reported as cross-reactive in the company&#x2019;s analysis (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table S1</bold></xref>). The <italic>e</italic>TFR significances computed for each virus antigen&#x2019;s thermodynamic profile aligned to its paired human amino acid sequence was compared to the experimental binding affinity for the same pair. To explore the relationship between <italic>e</italic>TFR significance and binding affinity, the binding data from all seven chips were pooled, and the linear correlation between affinity and significance was directly calculated.</p>
<p>It might be expected that no relationship would exist between binding <italic>Z</italic>-score and <italic>e</italic>TFR significance&#x2014;after all, the protein ensemble model <italic>COREX</italic>/<italic>eScape</italic> and the TFR/<italic>e</italic>TFR methods were not parameterized with any energetic information from protein&#x2013;protein binding, nor were they trained with the structures of any antibody&#x2013;antigen complexes&#x2014;but indeed, a significant relationship (<italic>p</italic> = 5 &#xd7; 10<sup>&#x2212;3</sup>) was observed (<xref ref-type="fig" rid="f4"><bold>Figure&#xa0;4A</bold></xref>). Insofar as <italic>Z</italic>-score and <italic>e</italic>TFR significance are related to &#x394;<italic>G</italic><sub>total</sub> and &#x394;<italic>G</italic><sub>conf</sub>, respectively, this finding suggests that (1) &#x394;<italic>G</italic><sub>conf</sub> contributes to &#x394;<italic>G</italic><sub>total</sub>, and (2) the magnitude of the contribution (i.e., the <italic>R</italic><sup>2</sup> value) is modest, approximately 10% for these cross-reactive protein pairs.</p>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>Sequence similarity does not contribute to &#x394;<italic>G</italic><sub>total</sub>, but &#x394;<italic>G</italic><sub>conf</sub> does. <bold>(A)</bold> Significant relationship between chip <italic>Z</italic>-score and <italic>e</italic>TFR significance suggests that &#x394;<italic>G</italic><sub>conf</sub> contributes to &#x394;<italic>G</italic><sub>total</sub>. Each point in the scatterplot represents one human protein compared to one virus protein. The <italic>x</italic>-axis denotes the computed thermodynamic similarity between the two proteins, which is related to &#x394;<italic>G</italic><sub>conf</sub>, as described in the text (Section 2.2). The <italic>y</italic>-axis denotes the experimental fluorescence measured as the relative binding of the human protein to the anti-virus protein antibody, which is related to &#x394;<italic>G</italic><sub>total</sub>, as described in the text (Section 2.1). A significant correlation suggests that &#x394;<italic>G</italic><sub>conf</sub> is associated with &#x394;<italic>G</italic><sub>total</sub>. <bold>(B)</bold> &#x394;<italic>G</italic><sub>conf</sub> contributes to &#x394;<italic>G</italic><sub>total</sub> despite the absence of sequence similarity. Each point in the scatterplot represents one human protein compared to one virus protein. The <italic>x</italic>-axis plots the computed optimal local sequence similarity between the two proteins. The <italic>y</italic>-axis plots the experimental fluorescence measured as the human protein binds to the anti-virus protein antibody, which is related to &#x394;<italic>G</italic><sub>total</sub>, as described in the text (Section 2.1). Lack of correlation suggests that sequence similarity is not associated with &#x394;<italic>G</italic><sub>total</sub>. Data for these figures, and the proteins involved, are listed in <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table S1</bold></xref>.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fimmu-17-1749369-g004.tif">
<alt-text content-type="machine-generated">Scatter plot A shows a positive correlation between relative antibody binding response and eTFR significance, with a correlation coefficient of 0.33 (p = 0.005). Scatter plot B indicates no correlation between binding response and FASTA &#x2212;log E-value, with a correlation coefficient of 0.00 (p = 0.96).</alt-text>
</graphic></fig>
<p>To rule out amino acid sequence identity as the driver for the correlation in <xref ref-type="fig" rid="f4"><bold>Figure&#xa0;4A</bold></xref>, sequence similarity was computed for the 70 virus&#x2013;human protein pairs by optimally aligning their full-length sequences using <italic>FASTA36</italic> (<xref ref-type="bibr" rid="B33">33</xref>) (Section 5.3). This local alignment algorithm is a stringent test for possible conserved sequence motifs as only the shortest, best match of highest sequence identity is reported, and random alignments are not considered. As no correlation was observed between <italic>Z</italic>-score and sequence similarity (<xref ref-type="fig" rid="f4"><bold>Figure&#xa0;4B</bold></xref>), the possibility that amino acid identity represents the source of the correlation is not supported by these studies, which further suggests that the compatibility of a human protein sequence with a viral protein fold (i.e., a viral protein ensemble) is contributing to the overall binding affinity, &#x394;<italic>G</italic><sub>total.</sub></p>
</sec>
</sec>
<sec id="s3" sec-type="discussion">
<label>3</label>
<title>Discussion</title>
<sec id="s3_1">
<label>3.1</label>
<title>Thermodynamic similarity between full-length proteins and relation to epitopes</title>
<p>The importance of the finding that conformational compatibility between full-length sequences can contribute to antibody cross-reactivity cannot be overstated. Yet, identifying the underlying determinants in each case and establishing causality is challenging due to the nature of the information involved. To highlight these challenges, we first make a distinction between our previous findings and what we report here. In earlier work, we demonstrated that proteins, rather than being classified in static structural terms, could be represented in thermodynamic terms, which reflect the relative stabilities of the different parts of the protein in the functional ensemble (<xref ref-type="bibr" rid="B19">19</xref>). Importantly, we showed that globular proteins appear to share common patterns of amino acid composition within this thermodynamic framework, providing the basis for a statistical free energy calculation. This allowed us to evaluate the compatibility of any sequence with the thermodynamic environments of any other protein structure, regardless of sequence or structural similarity. Furthermore, the fact that (1) the score of a sequence for a fold was correlated with the empirical stability of that sequence in that fold (<xref ref-type="bibr" rid="B19">19</xref>), and (2) sequence mutations that increased the score for a different fold caused the sequence to switch folds (if the score were high enough) (<xref ref-type="bibr" rid="B19">19</xref>), directly demonstrates that the previously reported TFR scores provide a measure of thermodynamic compatibility (<italic>i.e</italic>., &#x394;<italic>G</italic><sub>conf</sub>) of the two ensembles&#x2014;in effect validating the notion that a new type of EMM is real and, to at least some degree, predictable in the context of full-length protein sequences.</p>
<p>The work presented here, on the other hand, investigates whether that same EMM plays a role in the well-known phenomenon of antibody cross-reactivity. We reasoned that for binding reactions wherein the &#x394;<italic>G</italic><sub>int</sub> term for antibody binding (cf. <xref ref-type="fig" rid="f1"><bold>Figure&#xa0;1A</bold></xref>) is expected to be weak (as would be the case for the binding of proteins to antibodies raised against an entirely different protein), tight binding, if it were to be found at all, would be more likely to rely on a more favorable &#x394;<italic>G</italic><sub>conf</sub> term. Thus, challenging the human proteome with antibodies raised against seven viral proteins, which have no human homologs, provides a means for both identifying cases where cross-reactivity occurs, and determining the thermodynamic compatibility of the human sequence for the viral protein ensemble.</p>
<p>Unfortunately, the total binding energy (i.e., &#x394;<italic>G</italic><sub>total</sub>) for the cross-reacting antibodies consists of both &#x394;<italic>G</italic><sub>conf</sub>, which is computed, and the individual &#x394;<italic>G</italic><sub>int</sub> terms, which will likely vary on a case-by-case basis and may involve other mechanisms. Thus, although the absence of sequence and structural similarity precludes other types of reported mimicry mechanisms playing a role [see (<xref ref-type="bibr" rid="B34">34</xref>) and discussion below], we cannot conclude that all of the cross-reactivity is due to the ensemble similarity. However, the fact that a modest but statistically significant (<italic>p</italic> = 0.005) correlation is observed (<xref ref-type="fig" rid="f4"><bold>Figure&#xa0;4A</bold></xref>), even in the absence of recognizable sequence identity (<xref ref-type="fig" rid="f4"><bold>Figure&#xa0;4B</bold></xref>), strongly supports the hypothesis that conformational free energy (&#x394;<italic>G</italic><sub>conf</sub>) plays a role in antibody cross-reactivity across the proteome. The fact that the approach further reveals high thermodynamic scores for known cross-reactive epitopes (cf. <xref ref-type="fig" rid="f5"><bold>Figure&#xa0;5</bold></xref> and discussion below), even though none of the proteins involved (or any antibodies) were included in the algorithmic development, demonstrates this point and highlights what we can conclude from these results and what we cannot. Succinctly put, the approach identifies what other protein sequences can sample the conformational ensemble of the antigenic protein, but it does not propose a specific mechanism for antibody cross-reactivity for each case. Instead, the results demonstrate that the full-length protein ensemble compatibility (i.e., mimicry) reported previously (<xref ref-type="bibr" rid="B19">19</xref>) and embodied in the &#x394;<italic>G</italic><sub>conf</sub> term in <xref ref-type="fig" rid="f1"><bold>Figure&#xa0;1A</bold></xref> appears to contribute meaningfully to &#x394;<italic>G</italic><sub>total</sub>, when viewed across the proteome, being especially evident when probing specifically for cross-reactivity. Perhaps the most important result is that this approach can provide investigators with the ability to determine which protein sequences have a significant compatibility with the ensemble of another protein (and thus can potentially cross-react with antibodies raised against that protein). This capability could be especially useful in detecting thermodynamic compatibility where no recognizable sequence or structural similarity exists.</p>
<fig id="f5" position="float">
<label>Figure&#xa0;5</label>
<caption>
<p>Known examples of medically relevant cross-reactive epitopes anecdotally share thermodynamic similarity in the absence of sequence similarity. <bold>(A)</bold> Four cases of known cross-reactive epitopes implicated in auto-immune disease molecular mimicry. For each example, an intriguing correspondence between the predicted <italic>eScape</italic> local stabilities of the published aligned epitopes are observed. Amino acid identities are highlighted in bold green font, emphasizing the lack of homology between the epitopes as the identities range from only 8% to 33%. Multiple sclerosis (<xref ref-type="bibr" rid="B38">38</xref>) (upper left): virus protein Epstein&#x2013;Barr Virus Nuclear Antigen-1, residues 411&#x2013;426 (blue), and human Myelin Basic Protein, residues 205&#x2013;224 (red); Graves&#x2019; disease (<xref ref-type="bibr" rid="B37">37</xref>) (lower left): human thyroid peroxidase, residues 536&#x2013;547 (blue), and human thyroid peroxidase, residues 539&#x2013;550 (red); auto-immune encephalomyelitis (<xref ref-type="bibr" rid="B11">11</xref>) (lower right): human Myelin Basic Protein, residues 68&#x2013;95 (blue), and Chlamydia cysteine-rich outer membrane protein peptide (CRP, red); rheumatoid arthritis (<xref ref-type="bibr" rid="B11">11</xref>) (upper right): Glucose-6-phosphate isomerase, residues 282&#x2013;294 (blue), and Bovine RNase, residues 42&#x2013;46 (red). <bold>(B)</bold><italic>FVC</italic> program indicates that known cross-reactive epitopes exhibit higher-than-average thermodynamic similarity. Box-and-whiskers plots were made using cosine similarity output from FVC, as described in Section 4.6. Error bars encompass the maximum and minimum cosine similarity scores of the background, the blue box encloses one-half of the background data, and the horizontal line within denotes the average. Cosine similarities for known epitopes (red points) are consistently higher than expected by the background distributions for the full-length proteins from which they are derived (blue). The significance of 9 out of 11 epitopes scoring higher than average is estimated to be <italic>p</italic> &lt; 0.05. Numbers on the <italic>x</italic>-axis correspond to the following epitopes: (1) Multiple Sclerosis PLP and MHV proteins (<xref ref-type="bibr" rid="B11">11</xref>), (2) Multiple Sclerosis PLP and <italic>H. influenzae</italic> proteins (<xref ref-type="bibr" rid="B11">11</xref>), (3) Multiple Sclerosis MHV and <italic>H. influenzae</italic> proteins (<xref ref-type="bibr" rid="B11">11</xref>), (4) Encephalomyelitis MBP and <italic>C. pneumoniae</italic> proteins (<xref ref-type="bibr" rid="B11">11</xref>), (5) Myocarditis Myosin and CRP proteins (<xref ref-type="bibr" rid="B11">11</xref>), (6) Irritable Bowel Syndrome Mouse Hsp60 and Mycobacterium GroEL (<xref ref-type="bibr" rid="B11">11</xref>), (7) Rheumatoid Arthritis GPI and RNase (<xref ref-type="bibr" rid="B11">11</xref>), (8) Multiple Sclerosis Human MBP and Epstein&#x2013;Barr Virus protein (<xref ref-type="bibr" rid="B11">11</xref>), (9) Liver autoimmunity Mouse FAH and MHV protein (<xref ref-type="bibr" rid="B46">46</xref>), (10) Multi-inflammatory syndrome in children Human SNX8 and SARS-CoV-2 orf9 (<xref ref-type="bibr" rid="B47">47</xref>), and (11) Multiple Sclerosis EBNA-1 and Human MBP (<xref ref-type="bibr" rid="B38">38</xref>). Numbers 4, 7, and 11 are also explicitly shown in Figure <bold>(A)</bold>.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fimmu-17-1749369-g005.tif">
<alt-text content-type="machine-generated">Chart A presents eScape &#x394;G values in kcal/mol for conditions: Multiple Sclerosis, Rheumatoid Arthritis, Graves&#x2019; Disease, and Autoimmune Encephalomyelitis, with sequences highlighted. Chart B shows box plots of 8D Thermodynamic Cosine Similarity against known cross-reactive epitope numbers, with known epitopes marked in red and background distribution in blue.</alt-text>
</graphic></fig>
<p>Given the correlation between binding and conformational contribution reported here, and the caveats noted above, the questions, nonetheless, rightly turn to identifying the range of biophysical mechanisms for the unexpected cross-reactivity, and the location of the epitope(s). Is there a correlation between the epitope and the calculated high-scoring residues? Should there be? We note that unlike comparing experimental and calculated energies arising from the binding interface (<xref ref-type="bibr" rid="B35">35</xref>, <xref ref-type="bibr" rid="B36">36</xref>), where the contribution of individual positions is explicitly computed, there is no obligatory position-specific correspondence; sequence determinants that result in high agreement of one sequence for an ensemble need not correspond to the amino acids that serve as the epitope for the actual binding part of the reaction (cf. <xref ref-type="fig" rid="f1"><bold>Figure&#xa0;1A</bold></xref>). This point is made clear by considering that amino acids in stable, internal environments will contribute positively to high TFR scores, but epitopes are usually located primarily in less stable, surface-exposed sites (<xref ref-type="bibr" rid="B1">1</xref>, <xref ref-type="bibr" rid="B15">15</xref>, <xref ref-type="bibr" rid="B16">16</xref>). Consistent with this reasoning, it is noteworthy that our computational methods consider the full-length sequence of the antigen and cross-reacting proteins, and make no predictions about where the binding interfaces between antibody and antigen might be, as they are in principle unrelated. The situation is complicated further by the use of polyclonal antibodies, as, for example, the following two alternatives cannot be differentiated given an empirical binding affinity: (a) That many antibodies bind weakly to many epitopes on a given human protein, and the experimental signal is an integration of this heterogeneous response by the protein averaged over the ensemble, or (b) that few antibodies bind strongly to a single epitope on a given human protein, leading to the same experimental signal as (a).</p>
<p>The observed correlation between conformational equilibrium and relative antibody binding is also formally consistent with alternative models. For example, two or more distinct antibody populations within the polyclonal response could each bind unrelated epitopes on the virus and human proteins. In such a scenario, the association with ensemble similarity would still hold, but there would be no correspondence between the epitope and the scoring. These possibilities notwithstanding, identifying the location(s) of epitopes would help identify the range of scenarios and would further our understanding of this phenomenon. Distinguishing between these several possibilities positions techniques like epitope-mapping as the most straightforward way to address these questions, and studies to resolve these issues on a case-by-case basis are currently underway.</p>
<p>Given the challenges noted above, several lines of evidence support the notion that the computational methods may, nonetheless, provide clues about the nature and location of the epitopes in some cases. For example, fluorescence <italic>Z</italic>-scores obtained under denaturing vs. native conditions (<xref ref-type="fig" rid="f3"><bold>Figure&#xa0;3</bold></xref>) suggest that the binding affinity is essentially independent of whether the human protein binder is folded or unfolded, implying that most epitopes are likely to be continuous. We further reasoned that modifying the full-length thermodynamic matching to a more localized thermodynamic matching (e.g., global or local sequence alignments in <italic>FASTA</italic> or <italic>BLAST</italic>) may provide candidates for continuous epitopes. Support for this hypothesis was found by anecdotal inspection of <italic>eScape</italic> &#x394;<italic>G</italic> values for several published sequence-dissimilar cross-reactive auto-immune epitopes (<xref ref-type="fig" rid="f5"><bold>Figure&#xa0;5A</bold></xref>), which suggested that the local thermodynamic stabilities over 10- to 15-residue (i.e., epitope-sized) sequence fragments could exhibit similarity to the naked eye (although this similarity by itself does not rise to a level of statistical significance).</p>
<p>Armed with these observations, we developed an algorithm to extract optimal local matches from two <italic>eScape</italic> thermodynamic profiles, using only sequence information as input. The resultant <italic>Fragment Vector Comparison</italic> (<italic>FVC</italic>) algorithm calculates the <italic>8xL</italic>-dimensional cosine similarity between all pairwise sets of thermodynamic profiles of a specified window size, <italic>L</italic>, between two proteins (Section 4.6). Thus, a perfect correlation between the thermodynamics of two epitopes would yield an <italic>FVC</italic> score of 1.0, with lesser values indicating poorer matches. The resulting cosine similarities are then sorted, and the best local matches are retrieved.</p>
<p>(The <italic>FVC</italic> package, including <italic>eScape</italic>, is released along with this manuscript, and is freely available at the following site: <ext-link ext-link-type="uri" xlink:href="https://github.com/jBeale23/FragmentVectorComparison">https://github.com/jBeale23/FragmentVectorComparison</ext-link>).</p>
<p>Of note, when this approach was implemented, it was discovered that a majority of published cross-reactive epitopes from medical literature exhibited higher-than-average thermodynamic similarities (<xref ref-type="fig" rid="f5"><bold>Figure&#xa0;5B</bold></xref>), a statistically significant result (<italic>p</italic> &lt; 0.05). Furthermore, weighting each <italic>e</italic>TFR significance in <xref ref-type="fig" rid="f4"><bold>Figure&#xa0;4A</bold></xref> by the fraction of the sequence that scores greater than 0.95 on <italic>FVC</italic> when matched with the viral protein measurably improved the correlation (<xref ref-type="fig" rid="f6"><bold>Figure&#xa0;6</bold></xref>), as well as its significance (<italic>p</italic> = 2 &#xd7; 10<sup>&#x2212;3</sup>). This suggests that optimal local (epitope-sized) thermodynamic similarities, which may be subsumed within the optimal full-length similarities, may play an important role in the relationship between &#x394;<italic>G</italic><sub>conf</sub> and &#x394;<italic>G</italic><sub>total</sub>, perhaps suggestive of a connection between &#x394;<italic>G</italic><sub>conf</sub> and &#x394;<italic>G</italic><sub>int</sub>. Of course, the ultimate validity of this approach awaits additional experiments to determine whether <italic>FVC</italic> can actually predict the locations of the continuous cross-reactive epitopes responsible for <xref ref-type="fig" rid="f3"><bold>Figures&#xa0;3</bold></xref>, <xref ref-type="fig" rid="f4"><bold>4A</bold></xref>. To support such experiments, a list of candidate <italic>FVC</italic> matches for each protein pair in <xref ref-type="fig" rid="f4"><bold>Figure&#xa0;4</bold></xref> has been tabulated (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table S3</bold></xref>). It would truly be noteworthy if the determinants of the compatibility of a sequence for an ensemble overlapped with the epitope, but this is an open question, and one of the many possibilities requiring future studies.</p>
<fig id="f6" position="float">
<label>Figure&#xa0;6</label>
<caption>
<p>Simple weighting of <italic>e</italic>TFR significance by fraction of optimal local similarity improves correlation between &#x394;<italic>G</italic><sub>total</sub> and &#x394;<italic>G</italic><sub>conf</sub>. Each point in the scatterplot represents one human protein compared to one virus protein. The <italic>x</italic>-axis plots the computed full-length thermodynamic similarity between the two proteins, which is related to &#x394;<italic>G</italic><sub>conf</sub>, as described in the text (Section 2.2), weighted by the fraction of FVC matches greater than 0.99 contained within the full-length similarity. The <italic>y</italic>-axis plots the experimental fluorescence measured as the human protein binds to the anti-virus protein antibody, which is related to &#x394;<italic>G</italic><sub>total</sub>, as described in the text (Section 2.1). A significant correlation suggests that &#x394;<italic>G</italic><sub>conf</sub> is associated with &#x394;<italic>G</italic><sub>total</sub>. Because this correlation coefficient is improved over <xref ref-type="fig" rid="f4"><bold>Figure&#xa0;4A</bold></xref>, this suggests that epitope-sized regions of strongest thermodynamic similarity are important contributors to the correlation (compare with <xref ref-type="fig" rid="f4"><bold>Figure&#xa0;4A</bold></xref>).</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fimmu-17-1749369-g006.tif">
<alt-text content-type="machine-generated">Scatter plot showing the relationship between eTFR significance (negative log p-value times fraction of local matches) on the x-axis and relative antibody binding response (chip Z-score) on the y-axis. The plot features a positive correlation with a regression line, a correlation coefficient of 0.37, and a p-value of 0.002.</alt-text>
</graphic></fig>
</sec>
<sec id="s3_2">
<label>3.2</label>
<title>Thermodynamic molecular mimicry: source of cross-reactivity?</title>
<p>One common property shared among all documented cross-reactive epitopes in <xref ref-type="fig" rid="f5"><bold>Figure&#xa0;5</bold></xref> is that these medically relevant sequence fragments have undetectable pairwise identity with each other. How could one antibody bind to two epitopes in the absence of sequence similarity? Does a single subpopulation of the polyclonal antibody bind both the virus and human protein, or are there differences in the subpopulations that bind each protein? To explain this conundrum, the well-known phenomenon of molecular mimicry (<xref ref-type="bibr" rid="B34">34</xref>) has been proposed. Many examples of immunologic molecular mimicry have been documented (<xref ref-type="bibr" rid="B11">11</xref>, <xref ref-type="bibr" rid="B37">37</xref>, <xref ref-type="bibr" rid="B38">38</xref>), with Rojas et&#xa0;al. succinctly listing four distinct types spanning a continuum (<xref ref-type="bibr" rid="B34">34</xref>), ranging from complete structural similarity and sequence identity (Type 1) to structural similarity in the absence of sequence identity (Type 4). The type of molecular mimicry observed here is difficult to classify within this framework, because the common thermodynamic property is neither sequence nor structural in nature. These results suggest that the previously developed TFR scores in conjunction with the newly developed <italic>FVC</italic> matches provide a useful means of investigating the relationship between a more local &#x394;<italic>G</italic><sub>conf</sub> and the &#x394;<italic>G</italic><sub>int</sub> associated with the cross-reactive epitopes. Progress on these questions await epitope mapping studies on numerous systems.</p>
<p>The most general physical interpretation of EMM is that antibodies do not necessarily bind to a unique state, but instead to a subset of thermodynamically similar conformational states within an ensemble (<xref ref-type="fig" rid="f1"><bold>Figure&#xa0;1A</bold></xref>). Pairs of sequences can, to different extents, populate states that are thermodynamically similar to each other; thus, our hypothesis is that in such cases, antibodies raised to only one sequence can nonetheless bind both, as shown in the schematic model of EMM depicted in <xref ref-type="fig" rid="f7"><bold>Figure&#xa0;7</bold></xref>. Importantly, even in the absence of detectable structural similarity in the aligned regions, chemical groups such as hydrophobic side chains or hydrogen bond donors/acceptors would be geometrically placed to permit the same constellation of antibody(ies) to bind both antigens (<xref ref-type="bibr" rid="B37">37</xref>). This is the same principle that allows us to evaluate the preference of an amino acid sequence to adopt one conformation over another simply based on the scoring of amino acids in the corresponding environments of the new conformation without explicit consideration of structural context or interactions (<xref ref-type="bibr" rid="B19">19</xref>).</p>
<fig id="f7" position="float">
<label>Figure&#xa0;7</label>
<caption>
<p>Ensemble molecular mimicry. <bold>(A)</bold> A viral protein elicits a polyclonal immune response wherein the antibodies recognize specific antigenic sequence elements in the viral protein (red box, dashed border). <bold>(B)</bold> For any given protein (in this case human), there exists a conformational ensemble involving, among other states, those conformations that the antigenic viral sequence adopts (red box, dashed border). Human sequences that are compatible with the viral protein fold (green box, dashed border) will have increased probability of cross-reacting with the corresponding anti-viral antibody.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fimmu-17-1749369-g007.tif">
<alt-text content-type="machine-generated">Diagram showing a process of viral and human protein interaction. Part A illustrates viral protein antigens being processed into a viral protein ensemble, leading to antibody formation. Part B shows human proteins with similar thermodynamic compatibility aligning with the viral ensemble, resulting in antibody cross-reaction with human proteins, labeled &#x201c;Ensemble Molecular Mimicry."</alt-text>
</graphic></fig>
<p>Finally, with regard to medical relevance, the phenomenon of EMM identified here may play a role in unexplained aspects of auto-immunity, such as promiscuous antibodies (<xref ref-type="bibr" rid="B34">34</xref>, <xref ref-type="bibr" rid="B39">39</xref>, <xref ref-type="bibr" rid="B40">40</xref>) or the breaking of immune tolerance in the absence of sequence similarity between self and non-self (<xref ref-type="bibr" rid="B41">41</xref>, <xref ref-type="bibr" rid="B42">42</xref>). However, almost all extant cases of mimicry have been discovered individually in resource-intensive experiments (<xref ref-type="bibr" rid="B11">11</xref>, <xref ref-type="bibr" rid="B37">37</xref>, <xref ref-type="bibr" rid="B38">38</xref>, <xref ref-type="bibr" rid="B43">43</xref>), motivating the need for cross-reactivity-prediction tools that are less reliant on amino acid sequence identity. It is our hope that the observations reported here, as well as the tools accompanying this manuscript, will provide a new avenue for addressing this need and identifying possible molecular mimicry within a proteome.</p>
</sec>
</sec>
<sec id="s4">
<label>4</label>
<title>Methods</title>
<sec id="s4_1">
<label>4.1</label>
<title>Human proteome-on-a-chip experiments</title>
<p>Rabbit polyclonal IgG primary antibodies raised against purified complete SARS-CoV-2 proteins were purchased off-the-shelf from commercial sources, as described below. Primary antibodies listed below, and in <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table S1</bold></xref>, were sent to CDI Laboratories (Baltimore, MD and Mayaguez, PR) and passed over separate <italic>HuProt</italic> chips containing essentially complete representatives of each protein in the human proteome (<italic>HuProt v4.0</italic>, 21,215 distinct amino acid sequences). Binding of antibody to individual proteins was assessed by fluorescence (Alexa 555) of secondary anti-rabbit IgG according to the established procedure of CDI Laboratories. Binding was quantified for each human protein with a <italic>Z</italic>-score, representing the number of standard deviations above or below the average fluorescence signal over the entire chip. Objective analysis reports were received from CDI Laboratories listing the top 10 highest binding human proteins on each chip (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table S1</bold></xref>).</p>
<p>With the exception of the anti-SARS-CoV2-orf10 antibody, two chips were run for each antibody: a &#x201c;native&#x201d; chip, where the proteins on the chip were never exposed to denaturant, and a &#x201c;denatured&#x201d; chip, where the proteins on the chip were exposed to 8 M urea before incubation with the primary antibody. Native and denatured chips were compared to assess the possibility of structured epitopes, and it was found that there was generally a high correlation between native and denatured binding measurements (<xref ref-type="fig" rid="f3"><bold>Figure&#xa0;3</bold></xref>). This suggested the lack of widespread structured epitopes, indicating largely redundant information between native and denatured (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table S1</bold></xref>). A technical limitation resulted in the unavailability of denatured binding data for the orf10 experiment. Because of the high correlation between native and denatured observed for the other samples, orf10 native state values were substituted where necessary, without loss of information. However, it is emphasized that this substitution introduces a small but non-negligible source of uncertainty.</p>
<p>Although <italic>HuProt</italic> assays are reported to be reasonably reproducible, we explicitly tested the reproducibility of a separate antibody sample on chips from different batches, 1 year apart. This was polyclonal anti-human CD53 (Bioss Antibodies bs-13625R). The results indicated high correlation between the binding affinities of the two chips under native conditions (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Figure S2</bold></xref>). Therefore, the measurements and conclusions are believed to be robust.</p>
</sec>
<sec id="s4_2">
<label>4.2</label>
<title>Polyclonal antibodies used</title>
<p>All primary antibodies used here were polyclonal Rabbit IgG from commercial sources, at stock concentrations of 0.1&#x2013;1.0 mg/mL and generally raised against the full-length protein. Manufacturers included anti-SARS-CoV-2-orf9 (Novus Biologicals NBP3-00510), anti-SARS-CoV-2-nsp13 (Life Technologies/Invitrogen PA5120711), anti-SARS-CoV-2-nsp16 (Life Technologies/Invitrogen PA5120701), anti-SARS-CoV-2-Spike (Life Technologies/Invitrogen PA5116916), anti-SARS-CoV-2-orf6 (Life Technologies/Invitrogen PA5120715), anti-SARS-CoV-2-orf8 (Antibodies-Online ABIN7383791), and anti-SARS-CoV-2-orf10 (Antibodies-Online ABIN6952939). These antibodies were chosen based on a preliminary <italic>e</italic>TFR scan of the SARS-CoV-2 proteome against the amino acid sequences of the Protein Data Bank (<xref ref-type="bibr" rid="B2">2</xref>) described below and in <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Figure S1A</bold></xref>.</p>
</sec>
<sec id="s4_3">
<label>4.3</label>
<title>Computational methods: eTFR and FASTA alignments</title>
<p>The <italic>e</italic>TFR thermodynamic alignment algorithm was executed as described in previous publications, without modification. In detail, the process was as follows: One full-length virus protein sequence was fed into the <italic>eScape</italic> algorithm as input (included within the <italic>FVC</italic> code released with this manuscript, web app at <italic>best.bio.jhu.edu/eScape</italic>) (<xref ref-type="bibr" rid="B22">22</xref>, <xref ref-type="bibr" rid="B23">23</xref>). The output, two sets of four-dimensional vectors {&#x394;<italic>G</italic>, &#x394;<italic>H</italic><sub>ap</sub>, &#x394;<italic>H</italic><sub>pol</sub>, <italic>T</italic>&#x394;<italic>S</italic><sub>conf</sub>} corresponding to the native state and denatured state thermodynamic descriptors for each residue of the protein, were mapped to the eight native state and eight denatured state thermodynamic environments, as previously described (<xref ref-type="bibr" rid="B44">44</xref>). This information constitutes the complete query thermodynamic profile, and the process was repeated for each virus protein (i.e., the antigen against which each polyclonal was raised).</p>
<p>The workflow proceeded as individual pairwise gapless alignments of each query with the 10 amino acid sequences prioritized by CDI Labs, comparing the shorter of the pair in all possible registers with the longer sequence (<xref ref-type="bibr" rid="B32">32</xref>). Each register was scored by consulting a thermodynamic substitution matrix for each aligned amino acid&#x2013;environment pair and summing the total over the entire alignment (<xref ref-type="bibr" rid="B32">32</xref>). The total score was converted into a significance (<italic>p</italic>-value) according to the null model and length-dependent equation, as described previously (<xref ref-type="bibr" rid="B32">32</xref>). Separate scores and significances were computed for the native state and the denatured state, and the summed negative logs of the native and denatured significances were taken as the total score for that register (<xref ref-type="bibr" rid="B19">19</xref>). Finally, the maximum over all registers was taken as the optimal alignment and significance for that thermodynamic query&#x2013;amino acid sequence pair. (These values are plotted on the <italic>x</italic>-axis of <xref ref-type="fig" rid="f4"><bold>Figure&#xa0;4</bold></xref> and are listed in <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table S1</bold></xref>.) Thus, for the seven proteins in the SARS-CoV-2 proteome considered, the <italic>e</italic>TFR procedure resulted in two outputs (<xref ref-type="bibr" rid="B1">1</xref>): a pairwise alignment between the virus amino acid sequence and the human sequence (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table S2</bold></xref>), and (<xref ref-type="bibr" rid="B2">2</xref>) a significance estimation for that alignment (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table S1</bold></xref>).</p>
<p>Amino acid sequence alignments were performed using the FASTA36 package (<xref ref-type="bibr" rid="B33">33</xref>) and BLOSUM62 substitution matrix (<xref ref-type="bibr" rid="B45">45</xref>), with all default settings. The most significant <italic>E</italic>-value was always taken as the single optimal result between two pairs of proteins; these values are plotted on the <italic>x</italic>-axis of <xref ref-type="fig" rid="f4"><bold>Figure&#xa0;4B</bold></xref>.</p>
</sec>
<sec id="s4_4">
<label>4.4</label>
<title>Preliminary eTFR scan of the Protein Data Bank</title>
<p>Thermodynamic profiles of the Wuhan-Hu-1 SARS-CoV-2 proteome were computed using <italic>eScape</italic> from the 28 amino acid sequences translated from the NCBI Genomes accession NC_045512.2 (ncbi.nlm.nih.gov). Each of the 28 proteins in the SARS-CoV-2 proteome was used separately as query to exhaustively match all 594,420 amino acid sequences in the Protein Data Bank [download version date 06/14/21, <italic>rcsb.org</italic> (<xref ref-type="bibr" rid="B2">2</xref>)]. In detail, the process was as follows: One virus protein was fed into the <italic>eScape</italic> algorithm as input (included with the <italic>FVC</italic> code released with this manuscript, or web app at <italic>best.bio.jhu.edu/eScape</italic>). The output, two sets of four-dimensional vectors {&#x394;<italic>G</italic>, &#x394;<italic>H</italic><sub>ap</sub>, &#x394;<italic>H</italic><sub>pol</sub>, <italic>T</italic>&#x394;<italic>S</italic><sub>conf</sub>} corresponding to the native state and denatured state thermodynamic descriptors for each residue of the protein, were mapped to the eight native state and eight denatured state thermodynamic environments, as previously described (<xref ref-type="bibr" rid="B44">44</xref>). This information constitutes the complete query thermodynamic profile, and the process was repeated for each virus protein.</p>
<p>The query was then used to exhaustively search a database of all amino acid sequences of known structure, as contained in the Protein Data Bank. The search proceeded as individual pairwise gapless alignments of the query with one amino acid sequence, comparing the shorter of the pair in all possible registers with the longer one (<xref ref-type="bibr" rid="B32">32</xref>). Each register was scored by consulting a thermodynamic substitution matrix for each aligned amino acid&#x2013;environment pair and summing the total over the entire alignment (<xref ref-type="bibr" rid="B32">32</xref>). The total score was converted into a significance (<italic>p</italic>-value) according to the null model and length-dependent equation, as described previously (<xref ref-type="bibr" rid="B32">32</xref>). Separate scores and significances were computed for the native state and the denatured state, and the summed negative logs of the native and denatured-state significances were taken as the total score for that register (<xref ref-type="bibr" rid="B19">19</xref>). Finally, the maximum over all registers was taken as the optimal alignment and significance for that thermodynamic query&#x2013;amino acid sequence pair. These significance values are plotted on the <italic>y</italic>-axis of <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Figure S1A</bold></xref>.</p>
<p>The highest-scoring human proteins against each viral protein thermodynamic profile were tabulated by manual inspection (these proteins are indicated by red bars in <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Figure S1A</bold></xref>). Seven virus&#x2013;human matches were subjectively chosen on the basis of commercial availability of polyclonal antibody raised against the full-length viral protein and commercial availability of purified full-length human protein for Western blot analysis, described in the following. These seven matches chosen for testing are circled and numbered in <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Figure S1A</bold></xref>. The seven polyclonal antibodies comprised the panel of reagents used for the proteome-on-a-chip experiments shown in <xref ref-type="fig" rid="f4"><bold>Figure&#xa0;4</bold></xref> and <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table S1</bold></xref>.</p>
</sec>
<sec id="s4_5">
<label>4.5</label>
<title>Western blot experiments confirming cross-reactivity</title>
<p>Purified protein was obtained from commercial sources, as described below, at concentrations of approximately 0.1&#x2013;1.0 mg/mL. Generally, 10&#x2013;20 &#x3bc;L of this protein was loaded into 12%&#x2013;20% SDS-polyacrylamide Laemmli reducing slab gels to completion at ambient temperature (1 h, 200 V). Electrophoretic transfer to nitrocellulose membrane from the gel was performed under Tris&#x2013;glycine&#x2013;methanol pH 8.3 buffer conditions to completion at 4 &#xb0;C on ice (2 h, 400 A constant current). The membrane was blocked with Blocking Buffer (137 mM NaCl, 20 mM Tris, 0.1% Tween-20, and 5% dry milk, pH 7.6) for 24&#x2013;48 h at 4&#xb0;C. Then, the membrane was incubated with the primary antibody from the list above for at least 1 h at room temperature, washed 3&#xd7; with TBST (137 mM NaCl, 20 mM Tris, and 0.1% Tween-20, pH 7.6), incubated at least 30 min at room temperature with anti-rabbit IgG secondary antibody linked to horseradish peroxidase, and washed 3&#xd7; with TBST. Chemo-luminescence was generated with no more than 24-h-old SignalFire reagents (Cell Signaling Technology, Danvers, MA), according to the manufacturer&#x2019;s directions. Imaging was performed with CL-XPosure film (ThermoFisher Scientific, Baltimore, MD) at a short exposure of 30 s, and again at a long exposure of 2 h. Imaging was also performed in separate experiments with fluorescence scanning after incubation with DyLite 800 PEG 4&#xd7; conjugate secondary antibody, according to the manufacturer&#x2019;s directions (Cell Signaling Technology, Danvers, MA). Images are displayed in <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Figure S1B</bold></xref>. All cross-reactivity results shown in <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Figure S1B</bold></xref> were reproducible at least three times.</p>
<p>Primary antibody solutions were generally diluted 1:1,000 in Blocking Buffer, assuming an antibody concentration of approximately 0.1 mg/mL. Secondary antibodies were generally diluted 1:1,000 in Blocking Buffer, assuming an antibody concentration of approximately 0.1 mg/mL. Primary and secondary antibodies were reused for periods of up to 2 weeks, with storage at 4 &#xb0;C and added 0.1% final concentration sodium azide during the intervals.</p>
<p>All proteins used were commercially available at stock concentrations of 0.1&#x2013;1.0 mg/mL and were full length (or the longest length available, subject to coverage of the region of computational prediction). We purchased expected antigens as well as predicted cross-reactive proteins to test the efficacy of the polyclonal antibodies: all polyclonals were judged effective by Western blot analysis (data not shown). Manufacturers from which antigens and proteins were obtained were as follows: SARS-CoV-2-orf9 (R&amp;D Systems/Bio-techne 11033-CV-100), SARS-CoV-2-nsp13 (ProSci 10-427), SARS-CoV-2-nsp16 (ProSci 20-243, N-term uncleaved GST fusion), SARS-CoV-2-Spike (Life Technologies/Invitrogen RP87671, aa16-1213), SARS-CoV-2-orf6 (ProSci 20-193, N-term uncleaved MBP), SARS-CoV-2-orf8 (Life Technologies/Invitrogen RP87666, aa16-121), SARS-CoV-2-orf10 (ProSci 20-189, N-term uncleaved MBP), human-IL11 (Life Technologies/Gibco PHC0115), human-IGLL5 (MyBioSource MBS1029820), human-IL6 (Life Technologies/Invitrogen RP8619), human-SCN4B (OriGene TP323951), human-KDR/VEGFR2 (OriGene TP710248, aa20-764), human-CXCR4 (Abnova H00007852-G01), and human-CD53 (Abnova H00000963-G01).</p>
</sec>
<sec id="s4_6">
<label>4.6</label>
<title>Fragment vector comparison</title>
<p>The python implementation of the <italic>FVC</italic> program was used with all default settings, except that similarity cutoff was set to zero to record all local pairwise comparisons of fragment length <italic>L</italic> between two amino acid sequences. <italic>L</italic> was set to values between 9 and 25 residues long, depending on the length of the published alignment between one pair of cross-reactive epitopes. For each pair of cross-reactive epitopes, all cosine similarity scores computed for length <italic>L</italic> were used as the background distribution to make the box-and-whiskers plots in <xref ref-type="fig" rid="f5"><bold>Figure&#xa0;5B</bold></xref>. The single score corresponding to the fragment of length <italic>L</italic> in the register of the published alignment (i.e., only the documented epitope) was used to plot the red dots in <xref ref-type="fig" rid="f5"><bold>Figure&#xa0;5B</bold></xref>. The source code of <italic>FVC</italic>, which includes the <italic>eScape</italic> algorithm, is released as part of this manuscript, including a C implementation of the cosine similarity calculation that allows for higher throughput on supported device architectures. The code is freely and publicly available at the following site: <ext-link ext-link-type="uri" xlink:href="https://github.com/jBeale23/FragmentVectorComparison">https://github.com/jBeale23/FragmentVectorComparison</ext-link>.</p>
<p>For <xref ref-type="fig" rid="f6"><bold>Figure&#xa0;6</bold></xref>, <italic>FVC</italic> was run separately on each of the 70 virus antigen&#x2013;human protein pairs with window size set to 20 and similarity cutoff set to zero. Then, for each virus&#x2013;human pair, only <italic>FVC</italic> scores corresponding to the overlapping windows of the register found in the full-length thermodynamic <italic>e</italic>TFR alignment were retained. Of these <italic>N</italic> scores, a weight <italic>f</italic> was computed from <italic>f</italic> = <italic>M</italic>/<italic>N</italic>, where <italic>M</italic> was the number of scores with cosine similarity greater than 0.95. The <italic>x</italic>-axis of <xref ref-type="fig" rid="f6"><bold>Figure&#xa0;6</bold></xref> was thus computed from <italic>S</italic> &#xd7; <italic>f</italic>, where <italic>S</italic> is the <italic>e</italic>TFR significance (&#x2212;log <italic>p</italic>-value) from <xref ref-type="fig" rid="f4"><bold>Figure&#xa0;4A</bold></xref>. Values for <italic>f</italic>, <italic>M</italic>, and <italic>N</italic> obtained are listed in <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table S1</bold></xref>. This procedure merely weighted the full-length significance by the fraction of &#x201c;very similar&#x201d; local thermodynamic matches within the full-length alignment.</p>
<p>To facilitate future experiments, a list of the three highest matches of 20 residues found by <italic>FVC</italic> in the context of the full-length <italic>e</italic>TFR alignment between each pair of proteins in <xref ref-type="fig" rid="f4"><bold>Figure&#xa0;4</bold></xref> is given in <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table S3</bold></xref>. Note that these data may also be used to independently check the proper working of a locally installed version of <italic>FVC</italic>.</p>
</sec>
</sec>
</body>
<back>
<sec id="s5" sec-type="data-availability">
<title>Data availability statement</title>
<p>The datasets presented in this study can be found in the <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material</bold></xref>.</p></sec>
<sec id="s6" sec-type="author-contributions">
<title>Author contributions</title>
<p>JW: Conceptualization, Data curation, Formal analysis, Investigation, Methodology, Software, Visualization, Writing &#x2013; original draft, Writing &#x2013; review &amp; editing. VH: Conceptualization, Funding acquisition, Project administration, Supervision, Writing &#x2013; original draft, Writing &#x2013; review &amp; editing. JB: Investigation, Methodology, Software, Validation, Writing &#x2013; review &amp; editing. GF: Data curation, Formal analysis, Methodology, Software, Writing &#x2013; review &amp; editing. AM: Conceptualization, Data curation, Formal analysis, Writing &#x2013; review &amp; editing.</p></sec>
<ack>
<title>Acknowledgments</title>
<p>We thank Sara Rahman, Aria Heidsek and Buffy Wrabl for assistance and discussions.</p>
</ack>
<sec id="s8" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The author(s) declared that this work was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p></sec>
<sec id="s9" sec-type="ai-statement">
<title>Generative AI statement</title>
<p>The author(s) declared that generative AI was not used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p></sec>
<sec id="s10" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p></sec>
<sec id="s11" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fimmu.2026.1749369/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fimmu.2026.1749369/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="DataSheet1.pdf" id="SM1" mimetype="application/pdf"/></sec>
<ref-list>
<title>References</title>
<ref id="B1">
<label>1</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Madsen</surname> <given-names>AV</given-names></name>
<name><surname>Mejias-Gomez</surname> <given-names>O</given-names></name>
<name><surname>Pedersen</surname> <given-names>LE</given-names></name>
<name><surname>Preben Morth</surname> <given-names>J</given-names></name>
<name><surname>Kristensen</surname> <given-names>P</given-names></name>
<name><surname>Jenkins</surname> <given-names>TP</given-names></name>
<etal/>
</person-group>. 
<article-title>Structural trends in antibody-antigen binding interfaces: a computational analysis of 1833 experimentally determined 3D structures</article-title>. <source>Comput Struct Biotechnol J</source>. (<year>2024</year>) <volume>23</volume>:<fpage>199</fpage>&#x2013;<lpage>211</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.csbj.2023.11.056</pub-id>, PMID: <pub-id pub-id-type="pmid">38161735</pub-id>
</mixed-citation>
</ref>
<ref id="B2">
<label>2</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Burley</surname> <given-names>SK</given-names></name>
<name><surname>Berman</surname> <given-names>HM</given-names></name>
<name><surname>Duarte</surname> <given-names>JM</given-names></name>
<name><surname>Feng</surname> <given-names>Z</given-names></name>
<name><surname>Flatt</surname> <given-names>JW</given-names></name>
<name><surname>Hudson</surname> <given-names>BP</given-names></name>
<etal/>
</person-group>. 
<article-title>Protein data bank: A comprehensive review of 3D structure holdings and worldwide utilization by researchers, educators, and students</article-title>. <source>Biomolecules</source>. (<year>2022</year>) <volume>12</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/biom12101425</pub-id>, PMID: <pub-id pub-id-type="pmid">36291635</pub-id>
</mixed-citation>
</ref>
<ref id="B3">
<label>3</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Childers</surname> <given-names>MC</given-names></name>
<name><surname>Daggett</surname> <given-names>V</given-names></name>
</person-group>. 
<article-title>Molecular dynamics methods for antibody design</article-title>. <source>Methods Mol Biol</source>. (<year>2023</year>) <volume>2552</volume>:<page-range>109&#x2013;24</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/978-1-0716-2609-2_5</pub-id>, PMID: <pub-id pub-id-type="pmid">36346588</pub-id>
</mixed-citation>
</ref>
<ref id="B4">
<label>4</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Jeliazkov</surname> <given-names>JR</given-names></name>
<name><surname>Frick</surname> <given-names>R</given-names></name>
<name><surname>Zhou</surname> <given-names>J</given-names></name>
<name><surname>Gray</surname> <given-names>JJ</given-names></name>
</person-group>. 
<article-title>Robustification of rosettaAntibody and rosetta snugDock</article-title>. <source>PloS One</source>. (<year>2021</year>) <volume>16</volume>:<fpage>e0234282</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1371/journal.pone.0234282</pub-id>, PMID: <pub-id pub-id-type="pmid">33764990</pub-id>
</mixed-citation>
</ref>
<ref id="B5">
<label>5</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Kenlay</surname> <given-names>H</given-names></name>
<name><surname>Dreyer</surname> <given-names>FA</given-names></name>
<name><surname>Kovaltsuk</surname> <given-names>A</given-names></name>
<name><surname>Miketa</surname> <given-names>D</given-names></name>
<name><surname>Pires</surname> <given-names>D</given-names></name>
<name><surname>Deane</surname> <given-names>CM</given-names></name>
</person-group>. 
<article-title>Large scale paired antibody language models</article-title>. <source>PloS Comput Biol</source>. (<year>2024</year>) <volume>20</volume>:<fpage>e1012646</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1371/journal.pcbi.1012646</pub-id>, PMID: <pub-id pub-id-type="pmid">39642174</pub-id>
</mixed-citation>
</ref>
<ref id="B6">
<label>6</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Joubbi</surname> <given-names>S</given-names></name>
<name><surname>Micheli</surname> <given-names>A</given-names></name>
<name><surname>Milazzo</surname> <given-names>P</given-names></name>
<name><surname>Maccari</surname> <given-names>G</given-names></name>
<name><surname>Ciano</surname> <given-names>G</given-names></name>
<name><surname>Cardamone</surname> <given-names>D</given-names></name>
<etal/>
</person-group>. 
<article-title>Antibody design using deep learning: from sequence and structure design to affinity maturation</article-title>. <source>Brief Bioinform</source>. (<year>2024</year>) <volume>25</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bib/bbae307</pub-id>, PMID: <pub-id pub-id-type="pmid">38960409</pub-id>
</mixed-citation>
</ref>
<ref id="B7">
<label>7</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Bennett</surname> <given-names>NR</given-names></name>
<name><surname>Watson</surname> <given-names>JL</given-names></name>
<name><surname>Ragotte</surname> <given-names>RJ</given-names></name>
<name><surname>Borst</surname> <given-names>AJ</given-names></name>
<name><surname>See</surname> <given-names>DL</given-names></name>
<name><surname>Weidle</surname> <given-names>C</given-names></name>
<etal/>
</person-group>. 
<article-title>Atomically accurate de novo design of antibodies with RFdiffusion</article-title>. <source>Nature</source>. (<year>2025</year>) <volume>649</volume>:<page-range>183&#x2013;93</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1101/2024.03.14.585103</pub-id>, PMID: <pub-id pub-id-type="pmid">38562682</pub-id>
</mixed-citation>
</ref>
<ref id="B8">
<label>8</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Hummer</surname> <given-names>AM</given-names></name>
<name><surname>Schneider</surname> <given-names>C</given-names></name>
<name><surname>Chinery</surname> <given-names>L</given-names></name>
<name><surname>Deane</surname> <given-names>CM</given-names></name>
</person-group>. 
<article-title>Investigating the volume and diversity of data needed for generalizable antibody-antigen DeltaDeltaG prediction</article-title>. <source>Nat Comput Sci</source>. (<year>2025</year>) <volume>5</volume>:<page-range>635&#x2013;47</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s43588-025-00823-8</pub-id>, PMID: <pub-id pub-id-type="pmid">40629090</pub-id>
</mixed-citation>
</ref>
<ref id="B9">
<label>9</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Sachs</surname> <given-names>DH</given-names></name>
<name><surname>Schechter</surname> <given-names>AN</given-names></name>
<name><surname>Eastlake</surname> <given-names>A</given-names></name>
<name><surname>Anfinsen</surname> <given-names>CB</given-names></name>
</person-group>. 
<article-title>An immunologic approach to the conformational equilibria of polypeptides</article-title>. <source>Proc Natl Acad Sci U S A</source>. (<year>1972</year>) <volume>69</volume>:<page-range>3790&#x2013;4</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.69.12.3790</pub-id>, PMID: <pub-id pub-id-type="pmid">4118873</pub-id>
</mixed-citation>
</ref>
<ref id="B10">
<label>10</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Furie</surname> <given-names>B</given-names></name>
<name><surname>Schechter</surname> <given-names>AN</given-names></name>
<name><surname>Sachs</surname> <given-names>DH</given-names></name>
<name><surname>Anfinsen</surname> <given-names>CB</given-names></name>
</person-group>. 
<article-title>An immunological approach to the conformational equilibrium of staphylococcal nuclease</article-title>. <source>J Mol Biol</source>. (<year>1975</year>) <volume>92</volume>:<fpage>497</fpage>&#x2013;<lpage>506</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/0022-2836(75)90305-8</pub-id>, PMID: <pub-id pub-id-type="pmid">1171246</pub-id>
</mixed-citation>
</ref>
<ref id="B11">
<label>11</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Kohm</surname> <given-names>AP</given-names></name>
<name><surname>Fuller</surname> <given-names>KG</given-names></name>
<name><surname>Miller</surname> <given-names>SD</given-names></name>
</person-group>. 
<article-title>Mimicking the way to autoimmunity: an evolving theory of sequence and structural homology</article-title>. <source>Trends Microbiol</source>. (<year>2003</year>) <volume>11</volume>:<page-range>101&#x2013;5</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/S0966-842X(03)00006-4</pub-id>, PMID: <pub-id pub-id-type="pmid">12648936</pub-id>
</mixed-citation>
</ref>
<ref id="B12">
<label>12</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Wang</surname> <given-names>EY</given-names></name>
<name><surname>Mao</surname> <given-names>T</given-names></name>
<name><surname>Klein</surname> <given-names>J</given-names></name>
<name><surname>Dai</surname> <given-names>Y</given-names></name>
<name><surname>Huck</surname> <given-names>JD</given-names></name>
<name><surname>Jaycox</surname> <given-names>JR</given-names></name>
<etal/>
</person-group>. 
<article-title>Diverse functional autoantibodies in patients with COVID-19</article-title>. <source>Nature</source>. (<year>2021</year>) <volume>595</volume>:<page-range>283&#x2013;8</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41586-021-03631-y</pub-id>, PMID: <pub-id pub-id-type="pmid">34010947</pub-id>
</mixed-citation>
</ref>
<ref id="B13">
<label>13</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Wang</surname> <given-names>EY</given-names></name>
<name><surname>Dai</surname> <given-names>Y</given-names></name>
<name><surname>Rosen</surname> <given-names>CE</given-names></name>
<name><surname>Schmitt</surname> <given-names>MM</given-names></name>
<name><surname>Dong</surname> <given-names>MX</given-names></name>
<name><surname>Ferre</surname> <given-names>EMN</given-names></name>
<etal/>
</person-group>. 
<article-title>High-throughput identification of autoantibodies that target the human exoproteome</article-title>. <source>Cell Rep Methods</source>. (<year>2022</year>) <volume>2</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.crmeth.2022.100172</pub-id>, PMID: <pub-id pub-id-type="pmid">35360706</pub-id>
</mixed-citation>
</ref>
<ref id="B14">
<label>14</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Song</surname> <given-names>Y</given-names></name>
<name><surname>Li</surname> <given-names>J</given-names></name>
<name><surname>Wu</surname> <given-names>Y</given-names></name>
</person-group>. 
<article-title>Evolving understanding of autoimmune mechanisms and new therapeutic strategies of autoimmune disorders</article-title>. <source>Signal Transduct Target Ther</source>. (<year>2024</year>) <volume>9</volume>:<fpage>263</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41392-024-01952-8</pub-id>, PMID: <pub-id pub-id-type="pmid">39362875</pub-id>
</mixed-citation>
</ref>
<ref id="B15">
<label>15</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Laver</surname> <given-names>WG</given-names></name>
<name><surname>Air</surname> <given-names>GM</given-names></name>
<name><surname>Webster</surname> <given-names>RG</given-names></name>
<name><surname>Smith-Gill</surname> <given-names>SJ</given-names></name>
</person-group>. 
<article-title>Epitopes on protein antigens: misconceptions and realities</article-title>. <source>Cell</source>. (<year>1990</year>) <volume>61</volume>:<page-range>553&#x2013;6</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/0092-8674(90)90464-P</pub-id>, PMID: <pub-id pub-id-type="pmid">1693095</pub-id>
</mixed-citation>
</ref>
<ref id="B16">
<label>16</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Benjamin</surname> <given-names>DC</given-names></name>
<name><surname>Berzofsky</surname> <given-names>JA</given-names></name>
<name><surname>East</surname> <given-names>IJ</given-names></name>
<name><surname>Gurd</surname> <given-names>FR</given-names></name>
<name><surname>Hannum</surname> <given-names>C</given-names></name>
<name><surname>Leach</surname> <given-names>SJ</given-names></name>
<etal/>
</person-group>. 
<article-title>The antigenic structure of proteins: a reappraisal</article-title>. <source>Annu Rev Immunol</source>. (<year>1984</year>) <volume>2</volume>:<fpage>67</fpage>&#x2013;<lpage>101</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1146/annurev.iy.02.040184.000435</pub-id>, PMID: <pub-id pub-id-type="pmid">6085753</pub-id>
</mixed-citation>
</ref>
<ref id="B17">
<label>17</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Tsuboyama</surname> <given-names>K</given-names></name>
<name><surname>Dauparas</surname> <given-names>J</given-names></name>
<name><surname>Chen</surname> <given-names>J</given-names></name>
<name><surname>Laine</surname> <given-names>E</given-names></name>
<name><surname>Mohseni Behbahani</surname> <given-names>Y</given-names></name>
<name><surname>Weinstein</surname> <given-names>JJ</given-names></name>
<etal/>
</person-group>. 
<article-title>Mega-scale experimental analysis of protein folding stability in biology and design</article-title>. <source>Nature</source>. (<year>2023</year>) <volume>620</volume>:<page-range>434&#x2013;44</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41586-023-06328-6</pub-id>, PMID: <pub-id pub-id-type="pmid">37468638</pub-id>
</mixed-citation>
</ref>
<ref id="B18">
<label>18</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Escobedo</surname> <given-names>A</given-names></name>
<name><surname>Voigt</surname> <given-names>G</given-names></name>
<name><surname>Faure</surname> <given-names>AJ</given-names></name>
<name><surname>Lehner</surname> <given-names>B</given-names></name>
</person-group>. 
<article-title>Genetics, energetics, and allostery in proteins with randomized cores and surfaces</article-title>. <source>Science</source>. (<year>2025</year>) <volume>389</volume>:<fpage>eadq3948</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1126/science.adq3948</pub-id>, PMID: <pub-id pub-id-type="pmid">40705891</pub-id>
</mixed-citation>
</ref>
<ref id="B19">
<label>19</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Voortman-Sheetz</surname> <given-names>K</given-names></name>
<name><surname>Wrabl</surname> <given-names>JO</given-names></name>
<name><surname>Hilser</surname> <given-names>VJ</given-names></name>
</person-group>. 
<article-title>Impact of local unfolding fluctuations on the evolution of regional sequence preferences in proteins</article-title>. <source>Protein Sci</source>. (<year>2025</year>) <volume>34</volume>:<fpage>e70015</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/pro.70015</pub-id>, PMID: <pub-id pub-id-type="pmid">39969063</pub-id>
</mixed-citation>
</ref>
<ref id="B20">
<label>20</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Millard</surname> <given-names>CEF</given-names></name>
<name><surname>Wrabl</surname> <given-names>JO</given-names></name>
<name><surname>Brantley</surname> <given-names>SJ</given-names></name>
<name><surname>Grasso</surname> <given-names>E</given-names></name>
<name><surname>Schmitz</surname> <given-names>A</given-names></name>
<name><surname>White</surname> <given-names>JT</given-names></name>
<etal/>
</person-group>. 
<article-title>The ensemble basis of allostery and function: insights from models of local unfolding</article-title>. <source>J Mol Biol</source>. (<year>2025</year>) <volume>437</volume>:<fpage>169287</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.jmb.2025.169287</pub-id>, PMID: <pub-id pub-id-type="pmid">40499749</pub-id>
</mixed-citation>
</ref>
<ref id="B21">
<label>21</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Hilser</surname> <given-names>VJ</given-names></name>
<name><surname>Wrabl</surname> <given-names>JO</given-names></name>
<name><surname>Millard</surname> <given-names>CEF</given-names></name>
<name><surname>Schmitz</surname> <given-names>A</given-names></name>
<name><surname>Brantley</surname> <given-names>SJ</given-names></name>
<name><surname>Pearce</surname> <given-names>M</given-names></name>
<etal/>
</person-group>. 
<article-title>Statistical thermodynamics of the protein ensemble: mediating function and evolution</article-title>. <source>Annu Rev Biophys</source>. (<year>2025</year>) <volume>54</volume>:<page-range>227&#x2013;47</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1146/annurev-biophys-061824-104900</pub-id>, PMID: <pub-id pub-id-type="pmid">39929551</pub-id>
</mixed-citation>
</ref>
<ref id="B22">
<label>22</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Gu</surname> <given-names>J</given-names></name>
<name><surname>Hilser</surname> <given-names>VJ</given-names></name>
</person-group>. 
<article-title>Predicting the energetics of conformational fluctuations in proteins from sequence: a strategy for profiling the proteome</article-title>. <source>Structure</source>. (<year>2008</year>) <volume>16</volume>:<page-range>1627&#x2013;37</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.str.2008.08.016</pub-id>, PMID: <pub-id pub-id-type="pmid">19000815</pub-id>
</mixed-citation>
</ref>
<ref id="B23">
<label>23</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Gu</surname> <given-names>J</given-names></name>
<name><surname>Hilser</surname> <given-names>VJ</given-names></name>
</person-group>. 
<article-title>Sequence-based analysis of protein energy landscapes reveals nonuniform thermal adaptation within the proteome</article-title>. <source>Mol Biol Evol</source>. (<year>2009</year>) <volume>26</volume>:<page-range>2217&#x2013;27</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/molbev/msp140</pub-id>, PMID: <pub-id pub-id-type="pmid">19592668</pub-id>
</mixed-citation>
</ref>
<ref id="B24">
<label>24</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Onuchic</surname> <given-names>JN</given-names></name>
<name><surname>Luthey-Schulten</surname> <given-names>Z</given-names></name>
<name><surname>Wolynes</surname> <given-names>PG</given-names></name>
</person-group>. 
<article-title>Theory of protein folding: the energy landscape perspective</article-title>. <source>Annu Rev Phys Chem</source>. (<year>1997</year>) <volume>48</volume>:<fpage>545</fpage>&#x2013;<lpage>600</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1146/annurev.physchem.48.1.545</pub-id>, PMID: <pub-id pub-id-type="pmid">9348663</pub-id>
</mixed-citation>
</ref>
<ref id="B25">
<label>25</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Hilser</surname> <given-names>VJ</given-names></name>
<name><surname>Garcia-Moreno</surname> <given-names>EB</given-names></name>
<name><surname>Oas</surname> <given-names>TG</given-names></name>
<name><surname>Kapp</surname> <given-names>G</given-names></name>
<name><surname>Whitten</surname> <given-names>ST</given-names></name>
</person-group>. 
<article-title>A statistical thermodynamic model of the protein ensemble</article-title>. <source>Chem Rev</source>. (<year>2006</year>) <volume>106</volume>:<page-range>1545&#x2013;58</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1021/cr040423+</pub-id>, PMID: <pub-id pub-id-type="pmid">16683744</pub-id>
</mixed-citation>
</ref>
<ref id="B26">
<label>26</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Wand</surname> <given-names>AJ</given-names></name>
</person-group>. 
<article-title>Deep mining of the protein energy landscape</article-title>. <source>Struct Dyn</source>. (<year>2023</year>) <volume>10</volume>:<fpage>020901</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1063/4.0000180</pub-id>, PMID: <pub-id pub-id-type="pmid">37124940</pub-id>
</mixed-citation>
</ref>
<ref id="B27">
<label>27</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Wrabl</surname> <given-names>JO</given-names></name>
<name><surname>Larson</surname> <given-names>SA</given-names></name>
<name><surname>Hilser</surname> <given-names>VJ</given-names></name>
</person-group>. 
<article-title>Thermodynamic environments in proteins: fundamental determinants of fold specificity</article-title>. <source>Protein Sci</source>. (<year>2002</year>) <volume>11</volume>:<page-range>1945&#x2013;57</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1110/ps.0203202</pub-id>, PMID: <pub-id pub-id-type="pmid">12142449</pub-id>
</mixed-citation>
</ref>
<ref id="B28">
<label>28</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Larson</surname> <given-names>SA</given-names></name>
<name><surname>Hilser</surname> <given-names>VJ</given-names></name>
</person-group>. 
<article-title>Analysis of the &#x201c;thermodynamic information content&#x201d; of a Homo sapiens structural database reveals hierarchical thermodynamic organization</article-title>. <source>Protein Sci</source>. (<year>2004</year>) <volume>13</volume>:<page-range>1787&#x2013;801</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1110/ps.04706204</pub-id>, PMID: <pub-id pub-id-type="pmid">15215522</pub-id>
</mixed-citation>
</ref>
<ref id="B29">
<label>29</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Wang</surname> <given-names>S</given-names></name>
<name><surname>Gu</surname> <given-names>J</given-names></name>
<name><surname>Larson</surname> <given-names>SA</given-names></name>
<name><surname>Whitten</surname> <given-names>ST</given-names></name>
<name><surname>Hilser</surname> <given-names>VJ</given-names></name>
</person-group>. 
<article-title>Denatured-state energy landscapes of a protein structural database reveal the energetic determinants of a framework model for folding</article-title>. <source>J Mol Biol</source>. (<year>2008</year>) <volume>381</volume>:<page-range>1184&#x2013;201</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.jmb.2008.06.046</pub-id>, PMID: <pub-id pub-id-type="pmid">18616947</pub-id>
</mixed-citation>
</ref>
<ref id="B30">
<label>30</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Vertrees</surname> <given-names>J</given-names></name>
<name><surname>Wrabl</surname> <given-names>JO</given-names></name>
<name><surname>Hilser</surname> <given-names>VJ</given-names></name>
</person-group>. 
<article-title>Energetic profiling of protein folds</article-title>. <source>Methods Enzymol</source>. (<year>2009</year>) <volume>455</volume>:<fpage>299</fpage>&#x2013;<lpage>327</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/S0076-6879(08)04211-0</pub-id>, PMID: <pub-id pub-id-type="pmid">19289211</pub-id>
</mixed-citation>
</ref>
<ref id="B31">
<label>31</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Wrabl</surname> <given-names>JO</given-names></name>
<name><surname>Hilser</surname> <given-names>VJ</given-names></name>
</person-group>. 
<article-title>Investigating homology between proteins using energetic profiles</article-title>. <source>PloS Comput Biol</source>. (<year>2010</year>) <volume>6</volume>:<fpage>e1000722</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1371/journal.pcbi.1000722</pub-id>, PMID: <pub-id pub-id-type="pmid">20361049</pub-id>
</mixed-citation>
</ref>
<ref id="B32">
<label>32</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Hoffmann</surname> <given-names>J</given-names></name>
<name><surname>Wrabl</surname> <given-names>JO</given-names></name>
<name><surname>Hilser</surname> <given-names>VJ</given-names></name>
</person-group>. 
<article-title>The role of negative selection in protein evolution revealed through the energetics of the native state ensemble</article-title>. <source>Proteins</source>. (<year>2016</year>) <volume>84</volume>:<page-range>435&#x2013;47</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/prot.24989</pub-id>, PMID: <pub-id pub-id-type="pmid">26800099</pub-id>
</mixed-citation>
</ref>
<ref id="B33">
<label>33</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Pearson</surname> <given-names>WR</given-names></name>
</person-group>. 
<article-title>Finding protein and nucleotide similarities with FASTA</article-title>. <source>Curr Protoc Bioinf</source>. (<year>2016</year>) <volume>53</volume>:<fpage>3 9 1</fpage>&#x2013;<lpage>3 9 25</lpage>.
</mixed-citation>
</ref>
<ref id="B34">
<label>34</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Rojas</surname> <given-names>M</given-names></name>
<name><surname>Herran</surname> <given-names>M</given-names></name>
<name><surname>Ramirez-Santana</surname> <given-names>C</given-names></name>
<name><surname>Leung</surname> <given-names>PSC</given-names></name>
<name><surname>Anaya</surname> <given-names>JM</given-names></name>
<name><surname>Ridgway</surname> <given-names>WM</given-names></name>
<etal/>
</person-group>. 
<article-title>Molecular mimicry and autoimmunity in the time of COVID-19</article-title>. <source>J Autoimmun</source>. (<year>2023</year>) <volume>139</volume>:<fpage>103070</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.jaut.2023.103070</pub-id>, PMID: <pub-id pub-id-type="pmid">37390745</pub-id>
</mixed-citation>
</ref>
<ref id="B35">
<label>35</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Lee</surname> <given-names>J</given-names></name>
<name><surname>Seok</surname> <given-names>C</given-names></name>
<name><surname>Ham</surname> <given-names>S</given-names></name>
<name><surname>Chong</surname> <given-names>SH</given-names></name>
</person-group>. 
<article-title>Atomic-level thermodynamics analysis of the binding free energy of SARS-CoV-2 neutralizing antibodies</article-title>. <source>Proteins</source>. (<year>2023</year>) <volume>91</volume>:<fpage>694</fpage>&#x2013;<lpage>704</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/prot.26458</pub-id>, PMID: <pub-id pub-id-type="pmid">36564921</pub-id>
</mixed-citation>
</ref>
<ref id="B36">
<label>36</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Clark</surname> <given-names>AJ</given-names></name>
<name><surname>Gindin</surname> <given-names>T</given-names></name>
<name><surname>Zhang</surname> <given-names>B</given-names></name>
<name><surname>Wang</surname> <given-names>L</given-names></name>
<name><surname>Abel</surname> <given-names>R</given-names></name>
<name><surname>Murret</surname> <given-names>CS</given-names></name>
<etal/>
</person-group>. 
<article-title>Free energy perturbation calculation of relative binding free energy between broadly neutralizing antibodies and the gp120 glycoprotein of HIV-1</article-title>. <source>J Mol Biol</source>. (<year>2017</year>) <volume>429</volume>:<page-range>930&#x2013;47</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.jmb.2016.11.021</pub-id>, PMID: <pub-id pub-id-type="pmid">27908641</pub-id>
</mixed-citation>
</ref>
<ref id="B37">
<label>37</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Quaratino</surname> <given-names>S</given-names></name>
<name><surname>Thorpe</surname> <given-names>CJ</given-names></name>
<name><surname>Travers</surname> <given-names>PJ</given-names></name>
<name><surname>Londei</surname> <given-names>M</given-names></name>
</person-group>. 
<article-title>Similar antigenic surfaces, rather than sequence homology, dictate T-cell epitope molecular mimicry</article-title>. <source>Proc Natl Acad Sci U S A</source>. (<year>1995</year>) <volume>92</volume>:<page-range>10398&#x2013;402</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.92.22.10398</pub-id>, PMID: <pub-id pub-id-type="pmid">7479792</pub-id>
</mixed-citation>
</ref>
<ref id="B38">
<label>38</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Jog</surname> <given-names>NR</given-names></name>
<name><surname>McClain</surname> <given-names>MT</given-names></name>
<name><surname>Heinlen</surname> <given-names>LD</given-names></name>
<name><surname>Gross</surname> <given-names>T</given-names></name>
<name><surname>Towner</surname> <given-names>R</given-names></name>
<name><surname>Guthridge</surname> <given-names>JM</given-names></name>
<etal/>
</person-group>. 
<article-title>Epstein Barr virus nuclear antigen 1 (EBNA-1) peptides recognized by adult multiple sclerosis patient sera induce neurologic symptoms in a murine model</article-title>. <source>J Autoimmun</source>. (<year>2020</year>) <volume>106</volume>:<fpage>102332</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.jaut.2019.102332</pub-id>, PMID: <pub-id pub-id-type="pmid">31515129</pub-id>
</mixed-citation>
</ref>
<ref id="B39">
<label>39</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>James</surname> <given-names>LC</given-names></name>
<name><surname>Roversi</surname> <given-names>P</given-names></name>
<name><surname>Tawfik</surname> <given-names>DS</given-names></name>
</person-group>. 
<article-title>Antibody multispecificity mediated by conformational diversity</article-title>. <source>Science</source>. (<year>2003</year>) <volume>299</volume>:<page-range>1362&#x2013;7</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1126/science.1079731</pub-id>, PMID: <pub-id pub-id-type="pmid">12610298</pub-id>
</mixed-citation>
</ref>
<ref id="B40">
<label>40</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Van Regenmortel</surname> <given-names>MH</given-names></name>
</person-group>. 
<article-title>Specificity, polyspecificity, and heterospecificity of antibody-antigen recognition</article-title>. <source>J Mol Recognit</source>. (<year>2014</year>) <volume>27</volume>:<page-range>627&#x2013;39</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/jmr.2394</pub-id>, PMID: <pub-id pub-id-type="pmid">25277087</pub-id>
</mixed-citation>
</ref>
<ref id="B41">
<label>41</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Koncz</surname> <given-names>B</given-names></name>
<name><surname>Balogh</surname> <given-names>GM</given-names></name>
<name><surname>Manczinger</surname> <given-names>M</given-names></name>
</person-group>. 
<article-title>A journey to your self: The vague definition of immune self and its practical implications</article-title>. <source>Proc Natl Acad Sci U S A</source>. (<year>2024</year>) <volume>121</volume>:<fpage>e2309674121</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.2309674121</pub-id>, PMID: <pub-id pub-id-type="pmid">38722806</pub-id>
</mixed-citation>
</ref>
<ref id="B42">
<label>42</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Medzhitov</surname> <given-names>R</given-names></name>
<name><surname>Iwasaki</surname> <given-names>A</given-names></name>
</person-group>. 
<article-title>Exploring new perspectives in immunology</article-title>. <source>Cell</source>. (<year>2024</year>) <volume>187</volume>:<page-range>2079&#x2013;94</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.cell.2024.03.038</pub-id>, PMID: <pub-id pub-id-type="pmid">38670066</pub-id>
</mixed-citation>
</ref>
<ref id="B43">
<label>43</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Robinson</surname> <given-names>WH</given-names></name>
<name><surname>Steinman</surname> <given-names>L</given-names></name>
</person-group>. 
<article-title>Epstein-Barr virus and multiple sclerosis</article-title>. <source>Science</source>. (<year>2022</year>) <volume>375</volume>:<page-range>264&#x2013;5</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1126/science.abm7930</pub-id>, PMID: <pub-id pub-id-type="pmid">35025606</pub-id>
</mixed-citation>
</ref>
<ref id="B44">
<label>44</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Chin</surname> <given-names>AF</given-names></name>
<name><surname>Wrabl</surname> <given-names>JO</given-names></name>
<name><surname>Hilser</surname> <given-names>VJ</given-names></name>
</person-group>. 
<article-title>A thermodynamic atlas of proteomes reveals energetic innovation across the tree of life</article-title>. <source>Mol Biol Evol</source>. (<year>2022</year>) <volume>39</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/molbev/msac010</pub-id>, PMID: <pub-id pub-id-type="pmid">35038744</pub-id>
</mixed-citation>
</ref>
<ref id="B45">
<label>45</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Henikoff</surname> <given-names>S</given-names></name>
<name><surname>Henikoff</surname> <given-names>JG</given-names></name>
</person-group>. 
<article-title>Amino acid substitution matrices from protein blocks</article-title>. <source>Proc Natl Acad Sci U S A</source>. (<year>1992</year>) <volume>89</volume>:<page-range>10915&#x2013;9</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.89.22.10915</pub-id>, PMID: <pub-id pub-id-type="pmid">1438297</pub-id>
</mixed-citation>
</ref>
<ref id="B46">
<label>46</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Mathieu</surname> <given-names>PA</given-names></name>
<name><surname>Gomez</surname> <given-names>KA</given-names></name>
<name><surname>Coutelier</surname> <given-names>JP</given-names></name>
<name><surname>Retegui</surname> <given-names>LA</given-names></name>
</person-group>. 
<article-title>Sequence similarity and structural homologies are involved in the autoimmune response elicited by mouse hepatitis virus A59</article-title>. <source>J Autoimmun</source>. (<year>2004</year>) <volume>23</volume>:<page-range>117&#x2013;26</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.jaut.2004.05.006</pub-id>, PMID: <pub-id pub-id-type="pmid">15324930</pub-id>
</mixed-citation>
</ref>
<ref id="B47">
<label>47</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Bodansky</surname> <given-names>A</given-names></name>
<name><surname>Mettelman</surname> <given-names>RC</given-names></name>
<name><surname>Sabatino</surname> <given-names>JJ</given-names> <suffix>Jr.</suffix></name>
<name><surname>Vazquez</surname> <given-names>SE</given-names></name>
<name><surname>Chou</surname> <given-names>J</given-names></name>
<name><surname>Novak</surname> <given-names>T</given-names></name>
<etal/>
</person-group>. 
<article-title>Molecular mimicry in multisystem inflammatory syndrome in children</article-title>. <source>Nature</source>. (<year>2024</year>) <volume>632</volume>:<page-range>622&#x2013;9</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41586-024-07722-4</pub-id>, PMID: <pub-id pub-id-type="pmid">39112696</pub-id>
</mixed-citation>
</ref>
</ref-list>
<fn-group>
<fn id="n1" fn-type="custom" custom-type="edited-by">
<p>Edited by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/552616">Jefferson Russo Victor</ext-link>, School of Medicine - University of S&#xe3;o Paulo (FM-USP), Brazil</p></fn>
<fn id="n2" fn-type="custom" custom-type="reviewed-by">
<p>Reviewed by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1664179">Ashish Kumar Agrahari</ext-link>, Clemson University, United States</p>
<p><ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3297778">Jerome Anthony E. Alvarez</ext-link>, George Mason University, United States</p></fn>
</fn-group>
</back>
</article>