<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3-mathml3.dtd">
<article article-type="methods-article" dtd-version="1.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:ali="http://www.niso.org/schemas/ali/1.0/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Mol. Biosci.</journal-id>
<journal-title-group>
<journal-title>Frontiers in Molecular Biosciences</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Mol. Biosci.</abbrev-journal-title>
</journal-title-group>
<issn pub-type="epub">2296-889X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">1770157</article-id>
<article-id pub-id-type="doi">10.3389/fmolb.2026.1770157</article-id>
<article-version article-version-type="Version of Record" vocab="NISO-RP-8-2008"/>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Methods</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>Quantum chemical profiling of protein mutations via fragment-based DFT</article-title>
<alt-title alt-title-type="left-running-head">Leyva and Niazi</alt-title>
<alt-title alt-title-type="right-running-head">
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3389/fmolb.2026.1770157">10.3389/fmolb.2026.1770157</ext-link>
</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Leyva</surname>
<given-names>Alejandro</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/3320803"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing - original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Visualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/visualization/">Visualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal Analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Niazi</surname>
<given-names>M. Khalid Khan</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x26; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/">Writing - review and editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Project administration" vocab-term-identifier="https://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
</contrib>
</contrib-group>
<aff id="aff1">
<label>1</label>
<institution>Department of Biomedical Engineering, The Ohio State University</institution>, <city>Columbus</city>, <state>OH</state>, <country country="US">United States</country>
</aff>
<aff id="aff2">
<label>2</label>
<institution>Department of Pathology, The Ohio State University</institution>, <city>Columbus</city>, <state>OH</state>, <country country="US">United States</country>
</aff>
<author-notes>
<corresp id="c001">
<label>&#x2a;</label>Correspondence: Alejandro Leyva, <email xlink:href="mailto:aleyva14@outlook.com">aleyva14@outlook.com</email>; M. Khalid Khan, <email xlink:href="mailto:khalid.niazi@osumc.edu">khalid.niazi@osumc.edu</email>
</corresp>
</author-notes>
<pub-date publication-format="electronic" date-type="pub" iso-8601-date="2026-02-18">
<day>18</day>
<month>02</month>
<year>2026</year>
</pub-date>
<pub-date publication-format="electronic" date-type="collection">
<year>2026</year>
</pub-date>
<volume>13</volume>
<elocation-id>1770157</elocation-id>
<history>
<date date-type="received">
<day>17</day>
<month>12</month>
<year>2025</year>
</date>
<date date-type="rev-recd">
<day>21</day>
<month>01</month>
<year>2026</year>
</date>
<date date-type="accepted">
<day>21</day>
<month>01</month>
<year>2026</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2026 Leyva and Niazi.</copyright-statement>
<copyright-year>2026</copyright-year>
<copyright-holder>Leyva and Niazi</copyright-holder>
<license>
<ali:license_ref start_date="2026-02-18">https://creativecommons.org/licenses/by/4.0/</ali:license_ref>
<license-p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</license-p>
</license>
</permissions>
<abstract>
<p>Missense mutations have been extensively studied in tumor-suppressing antigens (TP53) to understand oncogenesis within malignant epithelial cells. Using Whole Exome Sequencing (WXS), missense mutations can be profiled into protein sequences to identify the most common variants in tumor samples. Since most mutations arise randomly, it is necessary to isolate those that produce dysfunctional proteins within large cohorts. Using threading and generative algorithms such as AlphaFold and ColabFold, large cohorts of WXS information can be converted into computationally analyzable structures. By evaluating both high- and low-confidence regions in these structures, these antigens can be studied en masse using pipelines that generate analytical inputs for quantum chemistry analysis. We created a pipeline that processed whole-exome sequencing (WXS) data and selected 28 representative TP53 missense mutants from the TCGA-BRCA cohort for quantum-chemical feasibility analysis. These structures were systematically cleaned using tools such as OpenBabel and AmberTools, and each was prepared for Natural Population Analysis (NPA), Electrostatic Potential (ESP) calculations, and Highest and Lowest Occupied Molecular Orbital (HOMO/LUMO) evaluation within Q-Chem. Using this pipeline, population genomics can be integrated with chemoinformatics to analyze electron density concentrations and generate hypothesis-generating electronic descriptors associated with protein dysfunction. By modifying the generated inputs, additional analyses such as Fukui orbitals, chemical shifts, and Raman shifts can also be performed. This provides a computational means to probe electronic properties not readily accessible at scale using experimental techniques.</p>
</abstract>
<kwd-group>
<kwd>AlphaFold</kwd>
<kwd>genomics</kwd>
<kwd>quantum chemistry</kwd>
<kwd>structural biology</kwd>
<kwd>whole exome sequencing</kwd>
</kwd-group>
<funding-group>
<funding-statement>The author(s) declared that financial support was received for this work and/or its publication. The project described was supported in part by R01 CA276301 (PIs: Niazi and Chen) from the National Cancer Institute, Pelatonia under IRP CC13702 (PIs: Niazi, Vilgelm, and Roy), The Ohio State University Department of Pathology and Comprehensive Cancer Center. The content is solely the responsibility of the authors and does not necessarily represent the official views of the National Cancer Institute or National Institutes of Health or The Ohio State University.</funding-statement>
</funding-group>
<counts>
<fig-count count="10"/>
<table-count count="2"/>
<equation-count count="0"/>
<ref-count count="32"/>
<page-count count="00"/>
</counts>
<custom-meta-group>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Biological Modeling and Simulation</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="s1">
<title>Introduction</title>
<p>The TP53 gene is a multi-domain transcription factor responsible for producing antigens that regulate apoptosis, cell cycles, autophagy, metabolism, and DNA repair (<xref ref-type="bibr" rid="B17">Joerger and Alan, 2008</xref>; <xref ref-type="bibr" rid="B19">Kastenhuber and Lowe, 2017</xref>). Within the 393-amino-acid protein, DNA binding occurs through residues 92&#x2013;292, producing upregulation or downregulation of specific cascades (<xref ref-type="bibr" rid="B6">Cho et al., 1994</xref>).</p>
<p>The tetramerization domain in residues 323&#x2013;356 is composed of a beta strand (326&#x2013;333), followed by alpha-helical regions (335&#x2013;355) that form a tetrameric structure connecting the domains of the p53 protein to form a dimer of dimers (<xref ref-type="bibr" rid="B7">Clore et al., 1994</xref>, <xref ref-type="bibr" rid="B24">Miller et al., 1999</xref>, <xref ref-type="bibr" rid="B32">Wang et al., 1994</xref>; <xref ref-type="bibr" rid="B22">Lalli et al., 2025</xref>). The hydrophobic core formed from isoleucine and leucine produces packing interactions around the region, creating the coordinative ability for conformational changes sequential to DNA binding (<xref ref-type="bibr" rid="B7">Clore et al., 1994</xref>, <xref ref-type="bibr" rid="B24">Miller et al., 1999</xref>, <xref ref-type="bibr" rid="B32">Wang et al., 1994</xref>; <xref ref-type="bibr" rid="B22">Lalli et al., 2025</xref>). Thr329 and Gly334 form the bridging strand between the beta strand and the alpha-helical region. Arginine and lysine residues at positions 337 and 351 stabilize the salt bridge between asparagine and arginine that corrects the orientation of the alpha helix. The surface of the alpha helices is covered by hydrophobic residues, including phenylalanine, leucine, isoleucine, and alanine. Orientation and parallelism of the helices are coordinated using isoleucine and leucine hydrogen bonds between amines. This produces a combination of van der Waals contacts between leucine and histidine, while forming side-chain interactions between leucine and isoleucine, with glycine residues orienting the angular position of the helix at a 40-degree angle for symmetry. Certain mutations target the salt bridge or hydrophobic packing, preventing transcriptional activation and dimerization of p53 molecules (<xref ref-type="bibr" rid="B5">Bullock and Fersht, 2001</xref>; <xref ref-type="bibr" rid="B16">Hulboy and Lozano, 1994</xref>).</p>
<p>The first 93 residues of p53 form transactivation domains 1 and 2, and the proline-rich region (62&#x2013;93) (<xref ref-type="bibr" rid="B15">Hu et al., 2006</xref>; <xref ref-type="bibr" rid="B21">Kussie et al., 1996</xref>; <xref ref-type="bibr" rid="B20">Kohn and Yves, 2005</xref>; <xref ref-type="bibr" rid="B8">Dyson and Wright, 2024</xref>; <xref ref-type="bibr" rid="B3">Beaucage and Caruthers, 1981</xref>). TAD1 contains residues allowing for phosphorylation, while TAD2 contains short alpha-helical strands that allow transcriptional activation of PUMA, NOXA, and BAX (<xref ref-type="bibr" rid="B15">Hu et al., 2006</xref>; <xref ref-type="bibr" rid="B21">Kussie et al., 1996</xref>; <xref ref-type="bibr" rid="B20">Kohn and Yves, 2005</xref>; <xref ref-type="bibr" rid="B8">Dyson and Wright, 2024</xref>; <xref ref-type="bibr" rid="B3">Beaucage and Caruthers, 1981</xref>). The proline-rich region is polymorphic, containing PXXP motifs that enable protein binding. Finally, the C-terminal regulatory domain contains large clusters of lysines for ubiquitination, methylation, and acetylation.</p>
<p>Using whole-exome sequencing, extracted DNA from cell lines can be enzymatically fragmented and biotinylated, allowing identification of protein-coding regions (<xref ref-type="bibr" rid="B3">Beaucage and Caruthers, 1981</xref>; <xref ref-type="bibr" rid="B2">Bachman, 2013</xref>; <xref ref-type="bibr" rid="B15">Hu et al., 2006</xref>). Once extracted, these reads are processed in parallel to produce short reads that are compiled by protein region to assemble the amino acid sequence. Once the base-pair content is known, codons can be assembled to produce the full protein.</p>
<p>Typical experimental protocols synthesize mutated DNA by using restriction digestion to excise the protein region of interest (<xref ref-type="bibr" rid="B27">Saiki et al., 1988</xref>; <xref ref-type="bibr" rid="B2">Bachman, 2013</xref>; <xref ref-type="bibr" rid="B23">Li et al., 2025</xref>; <xref ref-type="bibr" rid="B18">Jumper et al., 2021</xref>). Using synthetic DNA copies from phosphoramidite chemistry, a heteroduplex forms between mutant and wild-type sequences, and DNA polymerase synthesizes the mutant DNA, which is extracted using methylation-restriction digestion. Computationally, this process is far simpler, as the chemical behavior of proteins can be modeled using the sequence in AlphaFold with developed thresholding algorithms (<xref ref-type="bibr" rid="B10">Evans et al., 2021</xref>; <xref ref-type="bibr" rid="B25">Mirdita et al., 2022</xref>; <xref ref-type="bibr" rid="B28">Senior et al., 2020</xref>; <xref ref-type="bibr" rid="B31">Varadi et al., 2022</xref>; <xref ref-type="bibr" rid="B9">Epifanovsky et al., 2021</xref>). Using AlphaFold or ColabFold, multiple sequence alignments of protein inputs can be compared against evolutionary variants to predict protein geometry, which is then used to determine bond angles, turns, and secondary structures (<xref ref-type="bibr" rid="B10">Evans et al., 2021</xref>; <xref ref-type="bibr" rid="B25">Mirdita et al., 2022</xref>; <xref ref-type="bibr" rid="B28">Senior et al., 2020</xref>; <xref ref-type="bibr" rid="B31">Varadi et al., 2022</xref>; <xref ref-type="bibr" rid="B9">Epifanovsky et al., 2021</xref>). These generated protein structure files can be used for molecular dynamics simulations to analyze mechanistic behavior in isolated systems. However, since most mutations are random and functionally invariant, it is difficult to determine which p53 mutants are functionally significant.</p>
<p>Using Q-Chem, electron density distributions can be analyzed to identify electronic perturbations associated with protein mutations (<xref ref-type="bibr" rid="B29">Shao et al., 2006</xref>; <xref ref-type="bibr" rid="B13">Helgaker et al., 2000</xref>; <xref ref-type="bibr" rid="B30">Szabo and Ostlund, 1996</xref>; <xref ref-type="bibr" rid="B26">Parr and Yang, 1989</xref>; <xref ref-type="bibr" rid="B1">Achatz and Zambetti, 2016</xref>). Q-Chem provides this analysis by solving the Schr&#xf6;dinger equation using density-functional theory and Gaussian basis functions, assuming electrons move within probability densities around nuclei. This can be used to understand transition states and activation states in proteins, and the basis of chemical transitions within these systems. Using Natural Population Analysis, electron densities around nuclei can be quantified and compiled into natural orbitals, yielding stable means to measure charge and electron transfer. Electrostatic potentials and orbital occupations provide a way to track mechanistic differences within proteins for large-scale mutational studies. This provides a means to understand protein misfolding and altered reactivity within the tumor microenvironment. We hypothesize that AlphaFold can be used to generate large cohorts of Protein Data Bank (PDB) structures for quantum-chemical analysis for broad population-genetics studies (<xref ref-type="bibr" rid="B4">Buel and Walters, 2022</xref>).</p>
<p>Quantum chemical analysis provides a means to interrogate mutation-induced changes that are not directly observable from sequence or structural prediction alone. While structure-prediction methods capture global folding and domain organization, electronic descriptors derived from Q-Chem quantify how point mutations alter local charge distributions, electrostatic potential, and orbital stability that underlie biochemical interactions. In TP53, these electronic perturbations are relevant to zinc coordination, DNA-binding affinity, and tetramerization, where small changes in charge polarization or electronegativity can disrupt functional interactions without requiring large-scale structural rearrangement. As such, Q-Chem analytics enable a mechanistic interpretation of missense mutations by linking sequence variation to localized electronic effects that contribute to pathogenic dysfunction.</p>
</sec>
<sec sec-type="materials|methods" id="s2">
<title>Materials and methods</title>
<p>Within the TCGA-BRCA cohort, 28 WXS samples were randomly selected to be processed into FASTA files to maximize variability, with one control p53 PDB. The control TP53 sequence was derived from UniProt P04637 (<xref ref-type="bibr" rid="B4">Buel and Kylie, 2022</xref>). For the feasibility analysis, the 28 mutants were chosen to demonstrate the capability of the analysis, rather than to demonstrate experimental analysis. Due to the sample size, there is no guarantee of statistical reproducibility or robustness within the analyzed 28 WXS samples. All genetic analyses were performed on the entire BRCA cohort. Each chosen WXS mutant was characterized by its specific substitution and documented. ColabFold was used to generate five biological replicates of each mutant protein structure. Five ColabFold structural predictions were generated for each mutant; a single representative structure was selected for feasibility analysis to limit computational cost. OpenBabel was used to supply adequate hydrogens and ensure neutrality. Q-Chem 6.3.0 and Amber24 were used on the Ohio Supercomputer Center&#x2019;s Ascend cluster, running on NVIDIA A100 GPUs. AlphaFold 2.3.2 was accessed through ColabFold, in conjunction with Biopython, for structure inference. All base-pair sequences for each mutant in the whole-exome dataset were stored in a CSV named after the file ID, converted into amino-acid labels, and written into FASTA files for AlphaFold generation.</p>
<p>RMSD values and chemical shifts were extracted using BioPDB, and all inputs for sequential Q-Chem analysis were generated using Biopython and BioPDB. Quantum chemical calculations were performed on residue-centered local fragments (&#xb1;1 residue), ensuring that low-confidence global regions of AlphaFold/ColabFold models do not propagate into the electronic structure analysis. Local fragment-based quantum mechanical calculations do not require explicit propagation of global structure-prediction uncertainty, as the electronic structure is computed deterministically from fixed local geometries and interpreted in a comparative framework. All code is provided on GitHub for accessibility. Each input was then run in Q-Chem using a sequential shell script, in which Natural Population Analyses, Electrostatic Potentials, and orbital occupations (HOMO/LUMO) were computed. Electrostatic potentials were analyzed using the following parameters shown in <xref ref-type="table" rid="T1">Table 1</xref>, and the workflow for the analysis is shown in <xref ref-type="fig" rid="F1">Figure 1</xref>.</p>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>Q-Chem input parameters used for ESP charge calculation, NPA analysis, and HOMO/LUMO orbital extraction.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Parameter</th>
<th align="center">ESP (CHELPG)</th>
<th align="center">NPA</th>
<th align="center">HOMO/LUMO</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">JOBTYPE</td>
<td align="center">SP</td>
<td align="center">SP</td>
<td align="center">SP</td>
</tr>
<tr>
<td align="left">METHOD</td>
<td align="center">B3LYP</td>
<td align="center">B3LYP</td>
<td align="center">B3LYP</td>
</tr>
<tr>
<td align="left">BASIS</td>
<td align="center">6&#x2013;31G&#x2a;</td>
<td align="center">6&#x2013;31G&#x2a;</td>
<td align="center">6&#x2013;31G&#x2a;</td>
</tr>
<tr>
<td align="left">SCF_CONVERGENCE</td>
<td align="center">7</td>
<td align="center">7</td>
<td align="center">7</td>
</tr>
<tr>
<td align="left">MAX_SCF_CYCLES</td>
<td align="center">200</td>
<td align="center">200</td>
<td align="center">200</td>
</tr>
<tr>
<td align="left">SCF_ALGORITHM</td>
<td align="center">DIIS_GDM</td>
<td align="center">DIIS_GDM</td>
<td align="center">DIIS_GDM</td>
</tr>
<tr>
<td align="left">SYM_IGNORE</td>
<td align="center">1</td>
<td align="center">1</td>
<td align="center">1</td>
</tr>
<tr>
<td align="left">NO_REORIENT</td>
<td align="center">1</td>
<td align="center">1</td>
<td align="center">1</td>
</tr>
<tr>
<td align="left">CHELPG</td>
<td align="center">TRUE</td>
<td align="center">&#x2014;</td>
<td align="center">&#x2014;</td>
</tr>
<tr>
<td align="left">NBO</td>
<td align="center">&#x2014;</td>
<td align="center">1</td>
<td align="center">&#x2014;</td>
</tr>
<tr>
<td align="left">PRINT_ORBITALS</td>
<td align="center">&#x2014;</td>
<td align="center">&#x2014;</td>
<td align="center">TRUE</td>
</tr>
</tbody>
</table>
</table-wrap>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>Compact multi-row flowchart summarizing the computational pipeline from WXS data to structural modeling (AlphaFold) and quantum chemical analysis (Q-Chem).</p>
</caption>
<graphic xlink:href="fmolb-13-1770157-g001.tif">
<alt-text content-type="machine-generated">Flowchart illustrating a genomic workflow with four steps: whole-exome sequencing, variant calling and FASTA generation, structure prediction using AlphaFold, and quantum chemical analysis using Q-Chem, connected by downward arrows.</alt-text>
</graphic>
</fig>
<p>While the 6&#x2013;31G basis set provides advantageous computational speed and processing for larger sample sizes and analysis, it is acknowledged that the basis set is smaller and reduces accuracy in comparison to conventional basis sets. Specifically, 6&#x2013;31G lacks diffuse orbitals and angular momentum functions used to describe certain anionic or long-range electrostatic phenomena. In this study, the 6&#x2013;31G basis set was used for scaling and feasibility testing of Q-Chem analysis on the derived PDB files, rather than to improve the accuracy of the proposed method.</p>
</sec>
<sec sec-type="results" id="s3">
<title>Results</title>
<p>The results of the sequence generation analysis and ColabFold generation show low confidence within the proline-rich regions and a substantial portion of the DNA-binding domain, as shown in <xref ref-type="fig" rid="F2">Figure 2</xref>, likely due to the absence of evolutionary variants. <xref ref-type="table" rid="T2">Table 2</xref> displays summary statistics for the cohort, demonstrating a high proportion of missense mutations in addition to most of the mutations being located within the DNA-Binding Domain. This is reasonable, as most cancer-associated mutations are not natural or evolutionarily promoted (<xref ref-type="bibr" rid="B11">Giacomelli et al., 2018</xref>). Previous work has demonstrated that AlphaFold2 produces missense point-mutational protein structures that are very similar to the original protein structure (<xref ref-type="bibr" rid="B12">Haley, 2025</xref>). In addition, it has been observed that there is no correlation between pLDDT scores and the conservation of proteins such as green fluorescent protein, resulting in similar structures regardless of point mutations (<xref ref-type="bibr" rid="B12">Haley, 2025</xref>). In this study, we observe drastically lower pLDDT scores across all selected mutants, reflecting the use of a wider range of missense mutations. Previous studies validating AlphaFold&#x2019;s reconstruction performance have suggested that only 33% of human proteins in AlphaFold2 have confidence scores lower than 70% (<xref ref-type="bibr" rid="B14">Hosseini et al., 2025</xref>). This suggests that the model could not identify an adequate PDB template to model the protein, which resulted in a loss of structure relative to the original wild-type PDB. This led to disconfiguration of several domains, particularly the disruption of the beta-sandwich fold in the DNA-binding domain. This does not suggest contradictory results, as AlphaFold has not been shown to be accurate in reconstructing mutated proteins. Rather, the results demonstrate that the generated mutations are capable of inducing structural changes consistent with those expected from point mutations. This indicates that AlphaFold can model global folding patterns, while quantum chemical analysis is justified to ensure accurate predictions at the electronic level. Low-confidence generated structures are therefore used comparatively to assess local trends in electronic dispersion, without reliance on or interpretation of global structural effects. In addition, there are more than 100 distinct mutations within the cohort that arise in patients with breast cancer, and these sequences originate from malignant cells. Since most mutations were synthetic, the MSA could not identify an evolutionary match to the protein other than the original TP53 sequence. Nevertheless, protein generation was successful.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>AlphaFold/ColabFold structural prediction outputs for TP53 C176 variants. The full-width panel shows the predicted aligned error (PAE). The bottom row shows per-residue pLDDT confidence scores and the MSA sequence coverage. <bold>(a)</bold> Predicted aligned error (PAE). <bold>(b)</bold> Per-residue pLDDT confidence. <bold>(c)</bold> MSA sequence coverage.</p>
</caption>
<graphic xlink:href="fmolb-13-1770157-g002.tif">
<alt-text content-type="machine-generated">Five heatmaps labeled rank one through rank five show predicted aligned error (PAE) matrices with a color scale from blue to red. Below, a line graph plots predicted IDDT per position for all five ranks, showing variability across positions. To the right, a rectangular heatmap displays MSA sequence coverage with a predominantly purple color bar indicating sequence identity to the query.</alt-text>
</graphic>
</fig>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>Summary of TP53 mutation statistics.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Metric</th>
<th align="center">Value</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Total TP53 mutation records</td>
<td align="center">256</td>
</tr>
<tr>
<td align="left">Unique samples with TP53 mutation</td>
<td align="center">253</td>
</tr>
<tr>
<td align="left">Unique TP53 HGVSp variants</td>
<td align="center">127</td>
</tr>
<tr>
<td align="left">Missense mutations</td>
<td align="center">204</td>
</tr>
<tr>
<td align="left">Nonsense mutations</td>
<td align="center">52</td>
</tr>
<tr>
<td align="left">Mutations in TAD1 (1&#x2013;40)</td>
<td align="center">1</td>
</tr>
<tr>
<td align="left">Mutations in TAD2 (41&#x2013;61)</td>
<td align="center">4</td>
</tr>
<tr>
<td align="left">Mutations in PRR (62&#x2013;93)</td>
<td align="center">1</td>
</tr>
<tr>
<td align="left">Mutations in DBD (94&#x2013;292)</td>
<td align="center">232</td>
</tr>
<tr>
<td align="left">Mutations in OD (323&#x2013;356)</td>
<td align="center">13</td>
</tr>
<tr>
<td align="left">Mutations out of canonical range</td>
<td align="center">5</td>
</tr>
<tr>
<td align="left">Non-truncating mutations</td>
<td align="center">204</td>
</tr>
<tr>
<td align="left">Truncating mutations</td>
<td align="center">52</td>
</tr>
<tr>
<td align="left">Conservative missense mutations</td>
<td align="center">62</td>
</tr>
<tr>
<td align="left">Non-conservative missense mutations</td>
<td align="center">142</td>
</tr>
<tr>
<td align="left">Mutations with unchanged protein length</td>
<td align="center">256</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>Analytically, most mutations occurred in the DNA-binding domain, as shown in <xref ref-type="fig" rid="F3">Figure 3</xref>, which presents a statistically significant finding that these mutations arise despite the availability of residues. Most mutations in this cohort were missense rather than nonsense mutations, which is statistically more likely based on prior literature on mutational patterns in TP53 (<xref ref-type="bibr" rid="B11">Giacomelli et al., 2018</xref>). Most protein mutations were non-truncated, and as expected, all nonsense mutations resulted in shorter proteins.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>TP53 mutational landscape in the BRCA cohort: global mutation characteristics, truncation status, and biochemical severity. TP53 mutational landscape in the BRCA cohort (ext.): positional distributions, hotspot structure, and recurrent variants. <bold>(a)</bold> Mutation type distribution. <bold>(b)</bold> Domain-wise mutation counts. <bold>(c)</bold> Missense vs. nonsense per domain. <bold>(d)</bold> Truncating vs. non-truncating mutations. <bold>(e)</bold> Samples with truncating TP53 mutations. <bold>(f)</bold> Conservative vs. non-conservative missense. <bold>(g)</bold> Distribution of mutation positions. <bold>(h)</bold> Per-position sample counts (hotspots). <bold>(i)</bold> Top recurrent TP53 variants. <bold>(j)</bold> Top recurrent missense substitutions.</p>
</caption>
<graphic xlink:href="fmolb-13-1770157-g003.tif">
<alt-text content-type="machine-generated">Panel (a) shows a bar chart of TP53 mutation type distribution with missense mutations being more frequent than nonsense mutations. Panel (b) displays a bar chart of TP53 mutations by domain, with most mutations in the DBD domain. Panel (c) is a stacked bar chart of mutation types per domain, indicating missense and nonsense contributions for each domain. Panel (d) compares the number of truncating versus non-truncating TP53 mutations, showing non-truncating mutations are more common. Panel (e) presents the number of samples with and without truncating mutations, showing more samples without. Panel (f) visualizes conservative versus non-conservative missense mutations, with non-conservative being higher. Panel (g) depicts distribution of TP53 mutation positions across residues. Panel (h) presents a lollipop plot showing TP53 mutation hotspots by residue position. Panel (i) shows a bar chart of the top 20 recurrent TP53 variants, with some variants recurrent in more samples. Panel (j) displays the top 20 recurrent missense substitutions in TP53, highlighting frequent amino-acid changes.</alt-text>
</graphic>
</fig>
<p>Biochemically, most of these mutations were evaluated to be non-conservative according to BLOSUM62 scoring and the recorded amino acid substitutions. Most mutations occur within residues 150&#x2013;200, which correspond to the zinc-binding residues that functionalize TP53 DNA binding (<xref ref-type="bibr" rid="B6">Cho et al., 1994</xref>; <xref ref-type="bibr" rid="B17">Joerger and Alan, 2008</xref>; <xref ref-type="bibr" rid="B5">Bullock and Fersht, 2001</xref>). A secondary hotspot occurs between residues 250&#x2013;300, corresponding to arginine-binding positions that orient the helical structures of the dimerization complex (<xref ref-type="bibr" rid="B6">Cho et al., 1994</xref>; <xref ref-type="bibr" rid="B17">Joerger and Alan, 2008</xref>; <xref ref-type="bibr" rid="B5">Bullock and Fersht, 2001</xref>). The highest-frequency mutation was R157H, which occurs in the DNA-binding domain and results in downregulation of BMI1 and increased expression of TWIST1, producing epigenetic deformation and unregulated gene expression. Mutant variants such as R273H and R196, which have been found in myeloid acute leukemia and triple-negative breast cancer, respectively, correspond to worse prognosis (<xref ref-type="bibr" rid="B6">Cho et al., 1994</xref>; <xref ref-type="bibr" rid="B17">Joerger and Alan, 2008</xref>; <xref ref-type="bibr" rid="B5">Bullock and Fersht, 2001</xref>; <xref ref-type="bibr" rid="B11">Giacomelli et al., 2018</xref>). The most common amino acid substitution is from arginine to histidine, corresponding to the most frequent mutations within the BRCA cohort, all of which destabilize the DNA-binding domain and contribute to proliferation and reduced survival.</p>
<p>The results for the wild-type AlphaFold generation in <xref ref-type="fig" rid="F4">Figure 4</xref> showed high confidence and stable generation of replicates, with evolutionary convergence and high-confidence predictions within the DNA-binding domain. The predicted alignment error demonstrated high confidence across ranks. Wild-type generation of ColabFold structures was successful overall.</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>AlphaFold/ColabFold structural prediction outputs for TP53 Wild-Type. The full-width panel shows the predicted aligned error (PAE). The bottom row shows per-residue pLDDT confidence scores and the MSA sequence coverage. <bold>(a)</bold> Predicted aligned error (PAE). <bold>(b)</bold> Per-residue pLDDT confidence. <bold>(c)</bold> MSA sequence coverage.</p>
</caption>
<graphic xlink:href="fmolb-13-1770157-g004.tif">
<alt-text content-type="machine-generated">Panel (a) contains five contact maps labeled rank_1 to rank_5, showing distance matrices with a blue diagonal and red background, indicating predicted residue-residue distances. Panel (b) is a line graph titled &#x22;Predicted IDDT per position,&#x22; displaying predicted IDDT values on the y-axis across positions for each rank in different colors. Panel (c) is a sequence coverage heatmap, with sequences on the y-axis and positions on the x-axis, colored by sequence identity to query, and a black line representing sequence coverage across positions.</alt-text>
</graphic>
</fig>
<p>The display for the wild-type protein shown in <xref ref-type="fig" rid="F5">Figure 5</xref> was extracted from the Protein Data Bank, and the mutant structures were displayed on the left. Based on the generated structures, the beta-sandwich folds were not conserved, along with a substantial portion of the alpha-helical regions. Low-confidence regions are observed in the unstructured strands, and low-confidence wild-type strands are also shown within proline-rich regions and transactivation domains. The structures were conserved adequately for Q-Chem analysis.</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>Comparison of the predicted structures for wildtype and mutant TP53. Structural differences are visualized using AlphaFold/ColabFold predicted coordinates. <bold>(a)</bold> Wildtype TP53 structure. <bold>(b)</bold> Mutant TP53 structure.</p>
</caption>
<graphic xlink:href="fmolb-13-1770157-g005.tif">
<alt-text content-type="machine-generated">Panel (a) shows a ribbon diagram of a protein structure using a blue to red color gradient to represent its folding, while panel (b) displays a similar protein structure in green without gradient coloring.</alt-text>
</graphic>
</fig>
<p>Across the 28 mutants shown in <xref ref-type="fig" rid="F6">Figure 6</xref>, a lower electrostatic potential was observed across the cohort, as shown in <xref ref-type="fig" rid="F7">Figure 7</xref>, characterized by substitution of polar amino acids in conserved domains in the DNA-binding region (<xref ref-type="bibr" rid="B6">Cho et al., 1994</xref>; <xref ref-type="bibr" rid="B17">Joerger and Alan, 2008</xref>; <xref ref-type="bibr" rid="B5">Bullock and Fersht, 2001</xref>; <xref ref-type="bibr" rid="B9">Epifanovsky et al., 2021</xref>; <xref ref-type="bibr" rid="B29">Shao et al., 2006</xref>; <xref ref-type="bibr" rid="B13">Helgaker et al., 2000</xref>). High variability was also demonstrated across all mutants, though most mutations resulting in neutral residue substitution had similar variance. Mutants that resulted in substitutions of similar chemical character showed similar variability. Within the mutant cohort were seven cysteine-mutated variants, all within the binding domain that sever the zinc linkage (<xref ref-type="bibr" rid="B6">Cho et al., 1994</xref>; <xref ref-type="bibr" rid="B17">Joerger and Alan, 2008</xref>; <xref ref-type="bibr" rid="B5">Bullock and Fersht, 2001</xref>), one alanine mutant, three aspartate mutations, three glutamate mutations, three phenylalanine mutations, and three glycine mutants. Within this cohort, the glycine mutants typically substituted larger amino acids, while the glutamine mutants resulted in a complete shift from a negatively charged amino acid to a positive one. The phenylalanine mutants showed a shift toward polar thiols, representing a negative shift in charge, with most of these mutations concentrated within the dimerization complex. The cysteine mutations showed a mixed set of potential shifts in both directions, while the aspartate mutations were typically substituted with neutral or hydrophobic amino acids. Across the atomic charge distributions within the fragments of the first five mutants, the cysteine mutants demonstrated an overwhelming similarity at the mutation point and showed correlation with large decreases in ESP (<xref ref-type="bibr" rid="B29">Shao et al., 2006</xref>; <xref ref-type="bibr" rid="B13">Helgaker et al., 2000</xref>; <xref ref-type="bibr" rid="B30">Szabo and Ostlund, 1996</xref>; <xref ref-type="bibr" rid="B26">Parr and Yang, 1989</xref>; <xref ref-type="bibr" rid="B1">Achatz and Zambetti, 2016</xref>). The distribution across mutants shows a decrease in electric charge, which can be inferred from a subset of mutants, including glycine and cysteine variants, being replaced with polar residues. However, this could also be the result of the natural limitations of ESP analysis, especially at distances below 3 &#xc5; and when using a smaller basis set (6&#x2013;31G) (<xref ref-type="bibr" rid="B14">Hosseini et al., 2025</xref>). In this instance, ESP was used as a comparative analysis across all samples to infer structural changes from the ColabFold generation. This suggests that residue polarity shifts the stability and binding capacity of the DNA-binding region within the ColabFold-generated mutants.</p>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption>
<p>List of TP53 missense mutants analyzed in this study, showing residue position and amino-acid substitution relative to the wild-type sequence.</p>
</caption>
<graphic xlink:href="fmolb-13-1770157-g006.tif">
<alt-text content-type="machine-generated">Table listing twenty-nine mutations, displaying each mutation's notation and corresponding amino acid substitution. Columns include mutation number, mutation code, and amino acid change, with both full names and single-letter codes indicated for previous and substituted amino acids.</alt-text>
</graphic>
</fig>
<fig id="F7" position="float">
<label>FIGURE 7</label>
<caption>
<p>Using sinistrodextral labels, Electrostatic potential (ESP) analyses including <bold>(a)</bold> heatmap, <bold>(b)</bold> PCA, <bold>(c)</bold> first-mutant line plots, and <bold>(d)</bold> histogram of summed ESP charges <bold>(d)</bold>.</p>
</caption>
<graphic xlink:href="fmolb-13-1770157-g007.tif">
<alt-text content-type="machine-generated">Four scientific data visualizations summarizing ESP atomic charges across mutants: (a) heatmap showing charge variation by atom and mutant index, (b) scatter plot of PCA charge vectors, (c) line graph comparing atomic charge distributions for selected mutants, (d) bar chart displaying total ESP charge distribution among mutants.</alt-text>
</graphic>
</fig>
<p>Within the mutation fragments, the electronic distributions in <xref ref-type="fig" rid="F8">Figure 8</xref> were sparse. Across the first few mutants, the Natural Population Analysis demonstrated that each of the four cysteine mutations showed unique differences in charge across the atoms within the fragment, yet heavy convergence was noted at the third atom index, likely a component shared across all mutants (<xref ref-type="bibr" rid="B29">Shao et al., 2006</xref>; <xref ref-type="bibr" rid="B13">Helgaker et al., 2000</xref>; <xref ref-type="bibr" rid="B30">Szabo and Ostlund, 1996</xref>; <xref ref-type="bibr" rid="B26">Parr and Yang, 1989</xref>; <xref ref-type="bibr" rid="B1">Achatz and Zambetti, 2016</xref>). The distribution of charge across the NPA output contained outliers, though a high frequency of observations between 0.4 and 0.5, when summed over atoms, demonstrated high polarization within the fragment, with several mutants showing greater polarization approaching 0.7. The electron distributions in these mutants are overwhelmingly undersaturated, resulting in high polarization (<xref ref-type="bibr" rid="B29">Shao et al., 2006</xref>; <xref ref-type="bibr" rid="B13">Helgaker et al., 2000</xref>; <xref ref-type="bibr" rid="B30">Szabo and Ostlund, 1996</xref>; <xref ref-type="bibr" rid="B26">Parr and Yang, 1989</xref>; <xref ref-type="bibr" rid="B1">Achatz and Zambetti, 2016</xref>). This is consistent with the mechanisms by which the orientation of the DNA-binding domain collapses under disrupted zinc coordination and altered charge density.</p>
<fig id="F8" position="float">
<label>FIGURE 8</label>
<caption>
<p>Using sinistrodextral labels, Natural Population Analysis (NPA) charge analyses including <bold>(a)</bold> heatmap, <bold>(b)</bold> PCA, <bold>(c)</bold> first-mutant line plots, and <bold>(d)</bold> histogram of summed NPA charges.</p>
</caption>
<graphic xlink:href="fmolb-13-1770157-g008.tif">
<alt-text content-type="machine-generated">Panel (a) contains a heatmap showing NPA atomic charge values across mutants, where color intensity varies from blue to red indicating charge magnitude. Panel (b) presents a scatter plot of principal component analysis (PCA) of NPA charge vectors, with points representing individual mutants distributed along two principal components. Panel (c) features a line graph depicting NPA atomic charge distributions for the first few mutants, each represented by a distinct colored line across different atom indices. Panel (d) displays a histogram illustrating the distribution of total NPA charge summed over atoms, with frequency counts for different charge intervals.</alt-text>
</graphic>
</fig>
<p>Across the HOMO and LUMO distribution in <xref ref-type="fig" rid="F9">Figure 9</xref>, a high frequency of mutants displayed an overwhelmingly electronically stable distribution, which presents a limitation of the analysis. While ESP and NPA results conclude that the electrostatic potential is reduced and that the electron distribution across fragments is sparse, HOMO/LUMO analysis indicated relatively stable frontier orbital energies across mutants, underscoring the limited discriminatory power of HOMO&#x2013;LUMO metrics in this context. Many orbital energies were much lower than &#x2212;1.5, suggesting higher electronegativity within these atomic regions, though it is apparent that, across samples, the electronic stability across atoms is consistent among all mutants.</p>
<fig id="F9" position="float">
<label>FIGURE 9</label>
<caption>
<p>Using sinistrodextral labels, Quantum mechanical electronic structure metrics including <bold>(A)</bold> HOMO&#x2013;LUMO energy gap histogram and <bold>(B)</bold> HOMO&#x2013;LUMO scatter distribution across mutants.</p>
</caption>
<graphic xlink:href="fmolb-13-1770157-g009.tif">
<alt-text content-type="machine-generated">Histogram on the left presents the distribution of HOMO-LUMO gaps in electron volts for various mutants, with most gaps between 0.8 and 1.2 electron volts. Scatterplot on the right displays HOMO and LUMO energies in electron volts for mutants indexed along the x-axis, with HOMO energies lower and LUMO energies higher, both showing variability among mutants.</alt-text>
</graphic>
</fig>
<p>In order to compare the unstable mutants to the wild type, differences between the quantum electronic properties of each mutant and the wild type were graphed for NPA, ESP, and HOMO/LUMO analyses in <xref ref-type="fig" rid="F10">Figure 10</xref>. Across each atom in the mutant structures, there is consistently higher electronic sparsity compared to the wild type, with the exception of indices 10 and 20, which likely correspond to hydrogenous regions. The ESP values for the mutants were lower than those of the wild type across most variants. This suggests that electronic sparsity and reduced electrostatic potential may contribute to destabilization of DNA-binding or tetramerization regions by decreasing electronegativity in these regions. The orbital energies were much higher in the mutants than in the wild type, indicating lower electronegativity across the mutants. While these conclusions are limited by low-confidence ColabFold generations, they remain consistent with prior literature on mechanisms of TP53 affinity and structural destabilization.</p>
<fig id="F10" position="float">
<label>FIGURE 10</label>
<caption>
<p>Quantum-chemical perturbation of TP53 mutants relative to the wild-type (WT) fragment. <bold>(a)</bold> and <bold>(b)</bold> show WT-referenced changes in NPA and ESP atomic charges, respectively, highlighting residues and environments with strong electronic redistribution. <bold>(c)</bold> links frontier-orbital perturbation (HOMO&#x2013;LUMO gap) to the total magnitude of charge reorganization, summarizing how severely each mutant distorts the local electronic structure relative to WT. <bold>(a)</bold> ANPA atomic charges vs WT fragment. Each row corresponds to a TP53 mutant (in- cluding WT), each column to an atom index in the QM fragment; colors indicate the change in NPA charge relative to WT. <bold>(b)</bold> AESP (ChEIPG) atomic charges vs WT fragment. Each row corresponds to a TP53 mu- tant; colors indicate the change in ESP-derived partial charge relative to WT. <bold>(c)</bold> Relationship between HOMO-LUMO gap (eV) and the magnitude of the WT-referenced charge perturbation (L1 norm of Acharge vector). Each point is a TP53 mutant; larger values indicate stronger electronic disruption relative to WT.</p>
</caption>
<graphic xlink:href="fmolb-13-1770157-g010.tif">
<alt-text content-type="machine-generated">Panel (a) shows a heatmap of &#x394;NPA atomic charges versus wild-type fragment, with color ranging from blue (negative) to red (positive); panel (b) shows a similar heatmap for &#x394;ESP (CHELPG) atomic charges, using a comparable color scale; panel (c) displays a scatter plot with NPA L1 &#x394;charge versus wild-type on the y-axis and HOMO-LUMO gap (in electron volts) on the x-axis, indicating a general trend where higher electronic gaps correspond to lower &#x394;charge values.</alt-text>
</graphic>
</fig>
<p>The study presents a successful synthesis of mutant PDB forms, with electronic patterns characterized by lower electronegativity and sparse charge distribution. Likewise, there is lower electrostatic potential in these mutant types, reflecting low sample variability.</p>
</sec>
<sec sec-type="discussion" id="s4">
<title>Discussion</title>
<p>Population-level mutant analysis is possible using mass analysis of WXS sequencing. Transfer of these informatics into FASTA format and sequential ColabFold generation was successful, though confidence was unremarkable. Electrostatic potential was consistently lower in the mutant cohort due to the low sample size, and the electronic distribution was consistently more sparse, likely due to heavy residues and mutations with aromatic groups. Nevertheless, these mutations consistently exhibited lower electronegativity, which is compatible with previously reported destabilization mechanisms of DNA-binding domains and tetramerization regions. Orbital analyses demonstrated higher electronic stability within the mutants, and additional analyses can be performed to produce Raman spectra, chemical shifts, and nuclear magnetic resonance data across these fragments. These analyses can be used to perform cohort-level quantum characterization of gene mutations crucial in oncogenesis, more specifically, oncogenic processes.</p>
<p>Mass analysis of cancer cohort data can provide general mechanistic observations and characteristics regarding how mutations result in protein dysfunction. We generated structures for 28 mutants within the BRCA cohort using a developed pipeline and performed large-scale quantum chemical analysis to understand general trends in mutative behavior in TP53. For future studies, additional features can be developed specifically for high-confidence mutation prediction, in conjunction with physicochemical analysis.</p>
</sec>
<sec id="s5">
<title>Limitations</title>
<p>This study is limited by the low-confidence generation of ColabFold structures and does not use all five biological replicates. While the Q-Chem analyses are complete, the limited sample size constrains statistical generalization, positioning this study as a feasibility analysis. The pipeline is also limited by the use of ColabFold-generated wild-type structures. MSA was not able to generate high-confidence evolutionarily similar proteins for prediction of high-confidence regions, such that in-depth analysis of mutations in other domains is limited. The limited sample size of the BRCA cohort means that mutation analyses are valid primarily with respect to replicating previous observations reported in prior studies.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="s6">
<title>Data availability statement</title>
<p>The datasets presented in this study can be found in online repositories. The names of the repository/repositories and accession number(s) can be found in the article/supplementary material. All code is available on GitHub: <ext-link ext-link-type="uri" xlink:href="https://github.com/Alejandro21236/GenBlosum-WXSQCHEM">https://github.com/Alejandro21236/GenBlosum-WXSQCHEM</ext-link>.</p>
</sec>
<sec sec-type="author-contributions" id="s7">
<title>Author contributions</title>
<p>AL: Writing &#x2013; original draft, Methodology, Investigation, Visualization, Software, Validation, Data curation, Formal Analysis, Resources, Conceptualization. MN: Writing &#x2013; review and editing, Supervision, Project administration.</p>
</sec>
<sec sec-type="COI-statement" id="s9">
<title>Conflict of interest</title>
<p>The author(s) declared that this work was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="ai-statement" id="s10">
<title>Generative AI statement</title>
<p>The author(s) declared that generative AI was used in the creation of this manuscript. Grammar Correction and Punctuation.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p>
</sec>
<sec sec-type="disclaimer" id="s11">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Achatz</surname>
<given-names>M. I.</given-names>
</name>
<name>
<surname>Zambetti</surname>
<given-names>G. P.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>The inherited P53 mutation in the Brazilian population</article-title>. <source>Cold Spring Harb. Perspect. Med.</source> <volume>6</volume> (<issue>12</issue>), <fpage>a026195</fpage>. <pub-id pub-id-type="doi">10.1101/cshperspect.a026195</pub-id>
<pub-id pub-id-type="pmid">27663983</pub-id>
</mixed-citation>
</ref>
<ref id="B2">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bachman</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Site-directed mutagenesis</article-title>. <source>Methods Enzym.</source> <volume>529</volume>, <fpage>241</fpage>&#x2013;<lpage>248</lpage>. <pub-id pub-id-type="doi">10.1016/B978-0-12-418687-3.00019-7</pub-id>
<pub-id pub-id-type="pmid">24011050</pub-id>
</mixed-citation>
</ref>
<ref id="B3">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Beaucage</surname>
<given-names>S. L.</given-names>
</name>
<name>
<surname>Caruthers</surname>
<given-names>M. H.</given-names>
</name>
</person-group> (<year>1981</year>). <article-title>Deoxynucleoside phosphoramidites&#x2014;A new class of key intermediates for deoxypolynucleotide synthesis</article-title>. <source>Tetrahedron Lett.</source> <volume>22</volume> (<issue>20</issue>), <fpage>1859</fpage>&#x2013;<lpage>1862</lpage>. <pub-id pub-id-type="doi">10.1016/s0040-4039(01)90461-7</pub-id>
</mixed-citation>
</ref>
<ref id="B4">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Buel</surname>
<given-names>G. R.</given-names>
</name>
<name>
<surname>Kylie</surname>
<given-names>J. W.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Can AlphaFold2 predict the impact of missense mutations on structure?</article-title> <source>Nat. Struct. &#x26; Mol. Biol.</source> <volume>29</volume>, <fpage>1</fpage>&#x2013;<lpage>2</lpage>. <pub-id pub-id-type="doi">10.1038/s41594-021-00728-3</pub-id>
</mixed-citation>
</ref>
<ref id="B5">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bullock</surname>
<given-names>A. N.</given-names>
</name>
<name>
<surname>Fersht</surname>
<given-names>A. R.</given-names>
</name>
</person-group> (<year>2001</year>). <article-title>Rescuing the function of mutant p53</article-title>. <source>Nat. Rev. Cancer</source> <volume>1</volume>, <fpage>68</fpage>&#x2013;<lpage>76</lpage>. <pub-id pub-id-type="doi">10.1038/35094077</pub-id>
<pub-id pub-id-type="pmid">11900253</pub-id>
</mixed-citation>
</ref>
<ref id="B6">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cho</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Gorina</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Jeffrey</surname>
<given-names>P. D.</given-names>
</name>
<name>
<surname>Pavletich</surname>
<given-names>N. P.</given-names>
</name>
</person-group> (<year>1994</year>). <article-title>Crystal structure of a p53 tumor Suppressor&#x2013;DNA complex: understanding tumorigenic mutations</article-title>. <source>Science</source> <volume>265</volume> (<issue>5170</issue>), <fpage>346</fpage>&#x2013;<lpage>355</lpage>. <pub-id pub-id-type="doi">10.1126/science.8023157</pub-id>
<pub-id pub-id-type="pmid">8023157</pub-id>
</mixed-citation>
</ref>
<ref id="B7">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Clore</surname>
<given-names>G. M.</given-names>
</name>
<name>
<surname>Omichinski</surname>
<given-names>J. G.</given-names>
</name>
<name>
<surname>Sakaguchi</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Zambrano</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Sakamoto</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Appella</surname>
<given-names>E.</given-names>
</name>
<etal/>
</person-group> (<year>1994</year>). <article-title>High-resolution structure of the oligomerization domain of P53 by multidimensional NMR</article-title>. <source>Science</source> <volume>265</volume> (<issue>5170</issue>), <fpage>386</fpage>&#x2013;<lpage>391</lpage>. <pub-id pub-id-type="doi">10.1126/science.8023159</pub-id>
<pub-id pub-id-type="pmid">8023159</pub-id>
</mixed-citation>
</ref>
<ref id="B8">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dyson</surname>
<given-names>H. J.</given-names>
</name>
<name>
<surname>Wright</surname>
<given-names>P. E.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>How does P53 work? Regulation by the intrinsically disordered domains</article-title>. <source>Trends Biochem. Sci.</source> <volume>50</volume> (<issue>1</issue>), <fpage>9</fpage>&#x2013;<lpage>17</lpage>. <pub-id pub-id-type="doi">10.1016/j.tibs.2024.10.009</pub-id>
<pub-id pub-id-type="pmid">39578215</pub-id>
</mixed-citation>
</ref>
<ref id="B9">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Epifanovsky</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Gilbert</surname>
<given-names>A. T. B.</given-names>
</name>
<name>
<surname>Feng</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Mao</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Mardirossian</surname>
<given-names>N.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Software for the frontiers of quantum chemistry: an overview of the Q-Chem 5 package</article-title>. <source>J. Chem. Phys.</source> <volume>155</volume> (<issue>8</issue>), <fpage>084801</fpage>. <pub-id pub-id-type="doi">10.1063/5.0055522</pub-id>
<pub-id pub-id-type="pmid">34470363</pub-id>
</mixed-citation>
</ref>
<ref id="B10">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Evans</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>O&#x2019;Neill</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Pritzel</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Antropova</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Senior</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Green</surname>
<given-names>T.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Protein complex prediction with AlphaFold-Multimer</article-title>. <source>bioRxiv</source>. <pub-id pub-id-type="doi">10.1101/2021.10.04.463034</pub-id>
</mixed-citation>
</ref>
<ref id="B11">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Giacomelli</surname>
<given-names>A. O.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Lintner</surname>
<given-names>R. E.</given-names>
</name>
<name>
<surname>McFarland</surname>
<given-names>J. M.</given-names>
</name>
<name>
<surname>Duby</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Mutational processes shape the landscape of TP53 mutations in human cancer</article-title>. <source>Nat. Genet.</source> <volume>50</volume> (<issue>10</issue>), <fpage>1381</fpage>&#x2013;<lpage>1387</lpage>. <pub-id pub-id-type="doi">10.1038/s41588-018-0204-y</pub-id>
<pub-id pub-id-type="pmid">30224644</pub-id>
</mixed-citation>
</ref>
<ref id="B12">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Haley</surname>
<given-names>O. C.</given-names>
</name>
<name>
<surname>Tibbs-Cortes</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Hayford</surname>
<given-names>R. K.</given-names>
</name>
<name>
<surname>Harding</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Woodhouse</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Cannon</surname>
<given-names>E.</given-names>
</name>
<etal/>
</person-group> (<year>2025</year>). <article-title>Why do some predicted protein structures fold poorly? Benchmarking AlphaFold, ESMFold, and boltz in maize</article-title>. <source>bioRxiv</source>. <pub-id pub-id-type="doi">10.1101/2025.07.05.663230</pub-id>
</mixed-citation>
</ref>
<ref id="B13">
<mixed-citation publication-type="book">
<person-group person-group-type="author">
<name>
<surname>Helgaker</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>J&#xf8;rgensen</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Olsen</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2000</year>). <source>Molecular electronic-structure theory</source>. <publisher-name>Wiley</publisher-name>.</mixed-citation>
</ref>
<ref id="B14">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hosseini</surname>
<given-names>A. N.</given-names>
</name>
<name>
<surname>K&#x159;&#xed;&#x17e;</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>van der Spoel</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2025</year>). <article-title>Accurate electrostatics for biomolecular systems through machine learning</article-title>.</mixed-citation>
</ref>
<ref id="B15">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hu</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Gu</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Jeffrey</surname>
<given-names>P. D.</given-names>
</name>
<name>
<surname>Gu</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Shi</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2006</year>). <article-title>Structural basis of competitive recognition of P53 and MDM2 by HAUSP/USP7: implications for the regulation of the P53&#x2013;MDM2 pathway</article-title>. <source>PLoS Biol.</source> <volume>4</volume> (<issue>2</issue>), <fpage>e27</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pbio.0040027</pub-id>
<pub-id pub-id-type="pmid">16402859</pub-id>
</mixed-citation>
</ref>
<ref id="B16">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hulboy</surname>
<given-names>D. L.</given-names>
</name>
<name>
<surname>Lozano</surname>
<given-names>G.</given-names>
</name>
</person-group> (<year>1994</year>). <article-title>Structural and functional analysis of P53: the acidic activation domain has transforming capability</article-title>. <source>Cell Growth &#x26; Differ.</source> <volume>5</volume> (<issue>10</issue>), <fpage>1023</fpage>&#x2013;<lpage>1031</lpage>.<pub-id pub-id-type="pmid">7848903</pub-id>
</mixed-citation>
</ref>
<ref id="B17">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Joerger</surname>
<given-names>A. C.</given-names>
</name>
<name>
<surname>Alan</surname>
<given-names>R. F.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>Structural biology of the tumor suppressor p53</article-title>. <source>Oncogene</source> <volume>27</volume> (<issue>50</issue>), <fpage>6141</fpage>&#x2013;<lpage>6149</lpage>.<pub-id pub-id-type="pmid">18591933</pub-id>
</mixed-citation>
</ref>
<ref id="B18">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jumper</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Evans</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Pritzel</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Green</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Figurnov</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Ronneberger</surname>
<given-names>O.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Highly accurate protein structure prediction with AlphaFold</article-title>. <source>Nature</source> <volume>596</volume>, <fpage>583</fpage>&#x2013;<lpage>589</lpage>. <pub-id pub-id-type="doi">10.1038/s41586-021-03819-2</pub-id>
<pub-id pub-id-type="pmid">34265844</pub-id>
</mixed-citation>
</ref>
<ref id="B19">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kastenhuber</surname>
<given-names>E. R.</given-names>
</name>
<name>
<surname>Lowe</surname>
<given-names>S. W.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Putting p53 in context</article-title>. <source>Cell</source> <volume>170</volume> (<issue>6</issue>), <fpage>1062</fpage>&#x2013;<lpage>1078</lpage>. <pub-id pub-id-type="doi">10.1016/j.cell.2017.08.028</pub-id>
<pub-id pub-id-type="pmid">28886379</pub-id>
</mixed-citation>
</ref>
<ref id="B20">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kohn</surname>
<given-names>K. W.</given-names>
</name>
<name>
<surname>Yves</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>Molecular interaction map of the P53 and Mdm2 logic elements, which control the Off&#x2013;on switch of P53 in response to DNA damage</article-title>. <source>Biochem. Biophysical Res. Commun.</source> <volume>331</volume> (<issue>3</issue>), <fpage>816</fpage>&#x2013;<lpage>827</lpage>. <pub-id pub-id-type="doi">10.1016/j.bbrc.2005.03.186</pub-id>
</mixed-citation>
</ref>
<ref id="B21">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kussie</surname>
<given-names>P. H.</given-names>
</name>
<name>
<surname>Gorina</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Marechal</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Elenbaas</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Moreau</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Levine</surname>
<given-names>A. J.</given-names>
</name>
<etal/>
</person-group> (<year>1996</year>). <article-title>Structure of the MDM2 oncoprotein bound to the P53 tumor suppressor transactivation domain</article-title>. <source>Science</source> <volume>274</volume>, <fpage>948</fpage>&#x2013;<lpage>953</lpage>. <pub-id pub-id-type="doi">10.1126/science.274.5289.948</pub-id>
<pub-id pub-id-type="pmid">8875929</pub-id>
</mixed-citation>
</ref>
<ref id="B22">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lalli</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Zambetti</surname>
<given-names>G. P.</given-names>
</name>
<name>
<surname>Ribeiro</surname>
<given-names>R. C.</given-names>
</name>
<name>
<surname>Figueiredo</surname>
<given-names>B. C.</given-names>
</name>
</person-group> (<year>2025</year>). <article-title>Cancer associated to low-penetrance TP53 variants: insights from P.R337H</article-title>. <source>Trends Cancer</source> <volume>11</volume> (<issue>6</issue>), <fpage>499</fpage>&#x2013;<lpage>502</lpage>. <pub-id pub-id-type="doi">10.1016/j.trecan.2025.04.003</pub-id>
<pub-id pub-id-type="pmid">40268607</pub-id>
</mixed-citation>
</ref>
<ref id="B23">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Maksoud</surname>
<given-names>L. M.</given-names>
</name>
<name>
<surname>Gao</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2025</year>). <article-title>Structural basis of error-prone DNA synthesis by DNA polymerase</article-title>. <source>Nat. Commun.</source> <volume>16</volume> (<issue>1</issue>), <fpage>2063</fpage>. <pub-id pub-id-type="doi">10.1038/s41467-025-57269-9</pub-id>
<pub-id pub-id-type="pmid">40021647</pub-id>
</mixed-citation>
</ref>
<ref id="B24">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Miller</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Lubkowski</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Rao</surname>
<given-names>J. K.</given-names>
</name>
<name>
<surname>Danishefsky</surname>
<given-names>A. T.</given-names>
</name>
<name>
<surname>Omichinski</surname>
<given-names>J. G.</given-names>
</name>
<name>
<surname>Sakaguchi</surname>
<given-names>K.</given-names>
</name>
<etal/>
</person-group> (<year>1999</year>). <article-title>The oligomerization domain of P53: crystal structure of the trigonal form</article-title>. <source>FEBS Lett.</source> <volume>399</volume> (<issue>1&#x2013;2</issue>), <fpage>166</fpage>&#x2013;<lpage>170</lpage>. <pub-id pub-id-type="doi">10.1016/S0014-5793(96)01231-8</pub-id>
<pub-id pub-id-type="pmid">8980144</pub-id>
</mixed-citation>
</ref>
<ref id="B25">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mirdita</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Sch&#xfc;tze</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Moriwaki</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Heo</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Ovchinnikov</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Steinegger</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>ColabFold: making protein folding accessible to all</article-title>. <source>Nat. Methods</source> <volume>19</volume>, <fpage>679</fpage>&#x2013;<lpage>682</lpage>. <pub-id pub-id-type="doi">10.1038/s41592-022-01488-1</pub-id>
<pub-id pub-id-type="pmid">35637307</pub-id>
</mixed-citation>
</ref>
<ref id="B26">
<mixed-citation publication-type="book">
<person-group person-group-type="author">
<name>
<surname>Parr</surname>
<given-names>R. G.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>W.</given-names>
</name>
</person-group> (<year>1989</year>). <source>Density-functional theory of atoms and molecules</source>. <publisher-name>Oxford University Press</publisher-name>.</mixed-citation>
</ref>
<ref id="B27">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Saiki</surname>
<given-names>R. K.</given-names>
</name>
<name>
<surname>Gelfand</surname>
<given-names>D. H.</given-names>
</name>
<name>
<surname>Stoffel</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Scharf</surname>
<given-names>S. J.</given-names>
</name>
<name>
<surname>Higuchi</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Horn</surname>
<given-names>G. T.</given-names>
</name>
<etal/>
</person-group> (<year>1988</year>). <article-title>Primer-directed enzymatic amplification of DNA with a thermostable DNA polymerase</article-title>. <source>Science</source> <volume>239</volume> (<issue>4839</issue>), <fpage>487</fpage>&#x2013;<lpage>491</lpage>. <pub-id pub-id-type="doi">10.1126/science.2448875</pub-id>
<pub-id pub-id-type="pmid">2448875</pub-id>
</mixed-citation>
</ref>
<ref id="B28">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Senior</surname>
<given-names>A. W.</given-names>
</name>
<name>
<surname>Evans</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Jumper</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Kirkpatrick</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Sifre</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Green</surname>
<given-names>T.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Improved protein structure prediction using potentials from deep learning</article-title>. <source>Nature</source> <volume>577</volume>, <fpage>706</fpage>&#x2013;<lpage>710</lpage>. <pub-id pub-id-type="doi">10.1038/s41586-019-1923-7</pub-id>
<pub-id pub-id-type="pmid">31942072</pub-id>
</mixed-citation>
</ref>
<ref id="B29">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shao</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Molnar</surname>
<given-names>L. F.</given-names>
</name>
<name>
<surname>Jung</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Kussmann</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Ochsenfeld</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Brown</surname>
<given-names>S. T.</given-names>
</name>
<etal/>
</person-group> (<year>2006</year>). <article-title>Advances in methods and algorithms in a modern quantum chemistry program</article-title>. <source>PCCP</source> <volume>8</volume>, <fpage>3172</fpage>&#x2013;<lpage>3191</lpage>. <pub-id pub-id-type="doi">10.1039/b517914a</pub-id>
<pub-id pub-id-type="pmid">16902710</pub-id>
</mixed-citation>
</ref>
<ref id="B30">
<mixed-citation publication-type="book">
<person-group person-group-type="author">
<name>
<surname>Szabo</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Ostlund</surname>
<given-names>N. S.</given-names>
</name>
</person-group> (<year>1996</year>). <source>Modern quantum chemistry: introduction to advanced electronic structure theory</source>. <publisher-name>Dover Books</publisher-name>.</mixed-citation>
</ref>
<ref id="B31">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Varadi</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Anyango</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Deshpande</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Nair</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Natassia</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Yordanova</surname>
<given-names>G.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>AlphaFold protein structure database: massively expanding the structural coverage of protein-sequence space</article-title>. <source>Nucleic Acids Res.</source> <volume>50</volume>, <fpage>D439</fpage>&#x2013;<lpage>D444</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkab1061</pub-id>
<pub-id pub-id-type="pmid">34791371</pub-id>
</mixed-citation>
</ref>
<ref id="B32">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Reed</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Mayr</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Stenger</surname>
<given-names>J. E.</given-names>
</name>
<name>
<surname>Anderson</surname>
<given-names>M. E.</given-names>
</name>
<etal/>
</person-group> (<year>1994</year>). <article-title>P53 domains: structure, oligomerization, and transformation</article-title>. <source>Mol. Cell. Biol.</source> <volume>14</volume> (<issue>8</issue>), <fpage>5182</fpage>&#x2013;<lpage>5191</lpage>. <pub-id pub-id-type="doi">10.1128/mcb.14.8.5182</pub-id>
<pub-id pub-id-type="pmid">8035799</pub-id>
</mixed-citation>
</ref>
</ref-list>
<fn-group>
<fn fn-type="custom" custom-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1017997/overview">Patr&#xed;cia F. N. Fa&#xed;sca</ext-link>, University of Lisbon, Portugal</p>
</fn>
<fn fn-type="custom" custom-type="reviewed-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3232824/overview">Adam Chamberlin</ext-link>, Ambry Genetics, United States</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3331340/overview">A. Najla Hosseini</ext-link>, Karolinska Institutet (KI), Sweden</p>
</fn>
</fn-group>
</back>
</article>