<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Mol. Biosci.</journal-id>
<journal-title>Frontiers in Molecular Biosciences</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Mol. Biosci.</abbrev-journal-title>
<issn pub-type="epub">2296-889X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">1063620</article-id>
<article-id pub-id-type="doi">10.3389/fmolb.2022.1063620</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Molecular Biosciences</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Effect of naturally-occurring mutations on the stability and function of cancer-associated NQO1: Comparison of experiments and computation</article-title>
<alt-title alt-title-type="left-running-head">Pacheco-Garcia et al.</alt-title>
<alt-title alt-title-type="right-running-head">
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3389/fmolb.2022.1063620">10.3389/fmolb.2022.1063620</ext-link>
</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Pacheco-Garcia</surname>
<given-names>Juan Luis</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="fn" rid="fn1">
<sup>&#x2020;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2062408/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Cagiada</surname>
<given-names>Matteo</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="fn" rid="fn1">
<sup>&#x2020;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2043964/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Tienne-Matos</surname>
<given-names>Kelly</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2042367/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Salido</surname>
<given-names>Eduardo</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Lindorff-Larsen</surname>
<given-names>Kresten</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="fn" rid="fn2">
<sup>&#x2021;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/778347/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>L. Pey</surname>
<given-names>Angel</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<xref ref-type="fn" rid="fn2">
<sup>&#x2021;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/642905/overview"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Departamento de Qu&#xed;mica-F&#xed;sica</institution>, <institution>Universidad de Granada</institution>, <addr-line>Granada</addr-line>, <country>Spain</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Department of Biology</institution>, <institution>Linderstr&#xf8;m-Lang Centre for Protein Science</institution>, <institution>University of Copenhagen</institution>, <addr-line>Copenhagen</addr-line>, <country>Denmark</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Center for Rare Diseases (CIBERER)</institution>, <institution>Hospital Universitario de Canarias</institution>, <institution>Universidad de la Laguna</institution>, <addr-line>La Laguna</addr-line>, <country>Tenerife</country> <addr-line>Tenerife</addr-line>, <country>Spain</country>
</aff>
<aff id="aff4">
<sup>4</sup>
<institution>Departamento de Qu&#xed;mica F&#xed;sica</institution>, <institution>Unidad de Excelencia en Qu&#xed;mica Aplicada a Biomedicina y Medioambiente e Instituto de Biotecnolog&#xed;a</institution>, <institution>Universidad de Granada</institution>, <addr-line>Granada</addr-line>, <country>Spain</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/60084/overview">Daniele Dell&#x2019;Orco</ext-link>, University of Verona, Italy</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1801605/overview">Roberta Chiaraluce</ext-link>, Sapienza University of Rome, Italy</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/54757/overview">Carlo Travaglini-Allocatelli</ext-link>, Sapienza University of Rome, Italy</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Angel L. Pey, <email>angelpey@ugr.es</email>
</corresp>
<fn fn-type="equal" id="fn1">
<p>
<sup>&#x2020;</sup>These authors have contributed equally to this work and share first authorship</p>
</fn>
<fn fn-type="equal" id="fn2">
<label>
<sup>&#x2021;</sup>
</label>
<p>These authors share senior authorship</p>
</fn>
<fn fn-type="other">
<p>This article was submitted to Biological Modeling and Simulation, a section of the journal Frontiers in Molecular Biosciences</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>24</day>
<month>11</month>
<year>2022</year>
</pub-date>
<pub-date pub-type="collection">
<year>2022</year>
</pub-date>
<volume>9</volume>
<elocation-id>1063620</elocation-id>
<history>
<date date-type="received">
<day>07</day>
<month>10</month>
<year>2022</year>
</date>
<date date-type="accepted">
<day>03</day>
<month>11</month>
<year>2022</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2022 Pacheco-Garcia, Cagiada, Tienne-Matos, Salido, Lindorff-Larsen and L. Pey.</copyright-statement>
<copyright-year>2022</copyright-year>
<copyright-holder>Pacheco-Garcia, Cagiada, Tienne-Matos, Salido, Lindorff-Larsen and L. Pey</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>Recent advances in DNA sequencing technologies are revealing a large individual variability of the human genome. Our capacity to establish genotype-phenotype correlations in such large-scale is, however, limited. This task is particularly challenging due to the multifunctional nature of many proteins. Here we describe an extensive analysis of the stability and function of naturally-occurring variants (found in the COSMIC and gnomAD databases) of the cancer-associated human NAD(P)H:quinone oxidoreductase 1 (NQO1). First, we performed <italic>in silico</italic> saturation mutagenesis studies (&#x3e;5,000 substitutions) aimed to identify regions in NQO1 important for stability and function. We then experimentally characterized twenty-two naturally-occurring variants in terms of protein levels during bacterial expression, solubility, thermal stability, and coenzyme binding. These studies showed a good overall correlation between experimental analysis and computational predictions; also the magnitude of the effects of the substitutions are similarly distributed in variants from the COSMIC and gnomAD databases. Outliers in these experimental-computational genotype-phenotype correlations remain, and we discuss these on the grounds and limitations of our approaches. Our work represents a further step to characterize the mutational landscape of NQO1 in the human genome and may help to improve high-throughput <italic>in silico</italic> tools for genotype-phenotype correlations in this multifunctional protein associated with disease.</p>
</abstract>
<kwd-group>
<kwd>protein function</kwd>
<kwd>protein stability</kwd>
<kwd>genotype-phenotype correlations</kwd>
<kwd>computational prediction</kwd>
<kwd>sequence conservation</kwd>
</kwd-group>
<contract-num rid="cn002">P18-RT-2413 B-BIO-84-UGR20</contract-num>
<contract-sponsor id="cn001">Ministerio de Ciencia, Innovaci&#xf3;n y Universidades<named-content content-type="fundref-id">10.13039/100014440</named-content>
</contract-sponsor>
<contract-sponsor id="cn002">Consejer&#xed;a de Econom&#xed;a, Conocimiento, Empresas y Universidad, Junta de Andaluc&#xed;a<named-content content-type="fundref-id">10.13039/100016970</named-content>
</contract-sponsor>
<contract-sponsor id="cn003">Fundaci&#xf3;n para el Fomento de la Investigaci&#xf3;n Sanitaria y Biom&#xe9;dica de la Comunitat Valenciana<named-content content-type="fundref-id">10.13039/501100019157</named-content>
</contract-sponsor>
<contract-sponsor id="cn004">Novo Nordisk Fonden<named-content content-type="fundref-id">10.13039/501100009708</named-content>
</contract-sponsor>
</article-meta>
</front>
<body>
<sec id="s1">
<title>1 Introduction</title>
<p>Advances in technologies for whole-genome or exome sequencing and high-throughput functional assays have increased our knowledge on the consequences of the genetic variability in humans and the relationship to disease (<xref ref-type="bibr" rid="B29">McInnes et al., 2021</xref>; <xref ref-type="bibr" rid="B3">Arnedo-Pac et al., 2022</xref>; <xref ref-type="bibr" rid="B13">H&#xf8;ie et al., 2022</xref>; <xref ref-type="bibr" rid="B17">Katsonis et al., 2022</xref>). However, our capacity to predict the pathogenicity of single amino acid variants is still limited, with some approaches providing good overall results but failing to predict correlation for some individual mutations or phenotypes (<xref ref-type="bibr" rid="B17">Katsonis et al., 2022</xref>).</p>
<p>Current approaches for correlating genotype and phenotype can broadly be classified into two classes. First, experimental approaches are based on the characterization of one or several functional features (for example enzymatic function and regulation, protein-protein interactions, transport to different intracellular or extracellular locations, protein turnover, ligand binding) (<xref ref-type="bibr" rid="B54">Xu et al., 2017</xref>; <xref ref-type="bibr" rid="B1">Abildgaard et al., 2019</xref>; <xref ref-type="bibr" rid="B38">Pacheco-Garcia et al., 2021</xref>; <xref ref-type="bibr" rid="B13">H&#xf8;ie et al., 2022</xref>). In the case of high-throughput experimental approaches typically only one or two aspects of protein function are analysed (for example protein abundance or ability to rescue a growth phenotype) (<xref ref-type="bibr" rid="B8">Cagiada et al., 2021</xref>). Second, the use of structure- or sequence-based methods to predict pathogenicity are becoming increasingly robust (<xref ref-type="bibr" rid="B1">Abildgaard et al., 2019</xref>; <xref ref-type="bibr" rid="B3">Arnedo-Pac et al., 2022</xref>; <xref ref-type="bibr" rid="B13">H&#xf8;ie et al., 2022</xref>). Although experiments may be implemented in a high-throughput fashion, it has until now been limited to a relatively small set of proteins and assays (<xref ref-type="bibr" rid="B3">Arnedo-Pac et al., 2022</xref>; <xref ref-type="bibr" rid="B13">H&#xf8;ie et al., 2022</xref>). Thus, while computational approaches also have limitations, they may be appealing due to their potential application on a proteomic scale (<xref ref-type="bibr" rid="B3">Arnedo-Pac et al., 2022</xref>; <xref ref-type="bibr" rid="B13">H&#xf8;ie et al., 2022</xref>).</p>
<p>In this work, we apply both types of approaches to increase our understanding of the correlation between genotype and phenotype for missense variants of the human NAD(P)H:quinone oxidoreductase 1 (NQO1) protein. NQO1 is associated with several diseases including cancer, Alzheimer&#xb4;s and Parkinson&#x2019;s disease (<xref ref-type="bibr" rid="B6">Beaver et al., 2019</xref>; <xref ref-type="bibr" rid="B23">Luo et al., 2019</xref>). NQO1 is a multifunctional protein, displaying both enzymatic and non-enzymatic functions. As an enzyme, it catalyzes the FAD-dependent (two-electron) reduction of a large set of quinone substrates, with functions including redox maintenance of vitamins, detoxification of xenobiotics and activation of cancer pro-drugs (<xref ref-type="bibr" rid="B47">Ross and Siegel, 2018</xref>; <xref ref-type="bibr" rid="B6">Beaver et al., 2019</xref>; <xref ref-type="bibr" rid="B2">Anoz-Carbonell et al., 2020</xref>; <xref ref-type="bibr" rid="B48">Salido et al., 2022</xref>). Among non-enzymatic functions, NQO1 may interact with proteins and RNA, controlling their stability and function (<xref ref-type="bibr" rid="B6">Beaver et al., 2019</xref>; <xref ref-type="bibr" rid="B5">Asher et al., 2005</xref>; <xref ref-type="bibr" rid="B7">Ben-Nissan and Sharon, 2014</xref>; <xref ref-type="bibr" rid="B9">di Francesco et al., 2016</xref>; <xref ref-type="bibr" rid="B36">Oh et al., 2016</xref>). Many of these functions are associated with the catalytic competence and FAD binding, such as protein-protein interactions, intracellular stability and association with microtubules (<xref ref-type="bibr" rid="B5">Asher et al., 2005</xref>; <xref ref-type="bibr" rid="B27">Mart&#xed;nez-Lim&#xf3;n et al., 2016</xref>; <xref ref-type="bibr" rid="B28">Mart&#xed;nez-Lim&#xf3;n et al., 2020</xref>; <xref ref-type="bibr" rid="B49">Siegel et al., 2021</xref>). The native form of NQO1 is dimeric, containing two different domains: an N-terminal domain (NTD, residues 1&#x2013;225), that tightly binds one FAD molecule/domain required for catalysis and contains most of the monomer-monomer interface (MMI), whereas the C-terminal domain (CTD, residues 225&#x2013;274) complete the active site and the MMI (<xref ref-type="bibr" rid="B20">Li et al., 1995</xref>; <xref ref-type="bibr" rid="B10">Faig et al., 2000</xref>; <xref ref-type="bibr" rid="B21">Lienhart et al., 2014</xref>; <xref ref-type="bibr" rid="B32">Medina-Carmona et al., 2017a</xref>; <xref ref-type="bibr" rid="B38">Pacheco-Garcia et al., 2021</xref>).</p>
<p>We have recently shown that ligand binding and variant effects on stability propagate to long distances in the native state, affecting different functional features in a counterintuitive fashion (<xref ref-type="bibr" rid="B33">Medina-Carmona et al., 2016</xref>; <xref ref-type="bibr" rid="B43">Pey, 2018</xref>; <xref ref-type="bibr" rid="B30">Medina-Carmona et al., 2019a</xref>; <xref ref-type="bibr" rid="B52">Vankova et al., 2019</xref>; <xref ref-type="bibr" rid="B39">Pacheco-Garc&#xed;a et al., 2020</xref>; <xref ref-type="bibr" rid="B38">Pacheco-Garcia et al., 2021</xref>; <xref ref-type="bibr" rid="B37">Pacheco-Garcia et al., 2022a</xref>). Therefore, NQO1 represents a challenging and biomedically relevant system to compare the performance of computational and experimental methods to explain and to predict genotype-phenotype in a large-scale for a multi-functional protein. Here, we use computational tools to probe 5,187 variants of NQO1 that includes a set of clinically relevant missense variants which we then experimentally characterized. In this set, thirteen variants come from large-scale human sequencing data (gnomAD) and nine from the catalogue of somatic mutations in human cancer lines (COSMIC) (<xref ref-type="table" rid="T1">Table 1</xref>). As of ninth of January 2022, none of these variants were found in both databases. Whether variants found in COSMIC or gnomAD databases are associated with disease (e.g. predisposition to cancer development) is unknown. The set of variants we studied experimentally comprises very different amino acid side chain characteristics and display different levels of solvent exposure (<xref ref-type="table" rid="T1">Table 1</xref>).</p>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>Set of NQO1 variants experimentally characterized in this work.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Mutation</th>
<th align="left">Database</th>
<th align="left">% ASA<xref ref-type="table-fn" rid="Tfn1">
<sup>a</sup>
</xref>
</th>
<th align="left">Variant class</th>
<th align="left">Residue class</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">G3S</td>
<td align="left">gnomAD</td>
<td align="left">6.0 &#xb1; 4.7</td>
<td align="left">WT-like</td>
<td align="left">WT-like</td>
</tr>
<tr>
<td align="left">G3D</td>
<td align="left">COSMIC</td>
<td align="left">6.0 &#xb1; 4.7</td>
<td align="left">WT-like</td>
<td align="left">WT-like</td>
</tr>
<tr>
<td align="left">L7P</td>
<td align="left">COSMIC</td>
<td align="left">0.3 &#xb1; 0.2</td>
<td align="left">Total-loss</td>
<td align="left">Total-loss</td>
</tr>
<tr>
<td align="left">L7R</td>
<td align="left">gnomAD</td>
<td align="left">0.3 &#xb1; 0.2</td>
<td align="left">Total-loss</td>
<td align="left">Total-loss</td>
</tr>
<tr>
<td align="left">V9I</td>
<td align="left">gnomAD</td>
<td align="left">0.0 &#xb1; 0.0</td>
<td align="left">WT-like</td>
<td align="left">Total-loss</td>
</tr>
<tr>
<td align="left">T16M</td>
<td align="left">gnomAD</td>
<td align="left">43 &#xb1; 14</td>
<td align="left">Stable but inactive</td>
<td align="left">WT-like</td>
</tr>
<tr>
<td align="left">Y20N</td>
<td align="left">gnomAD</td>
<td align="left">21 &#xb1; 5</td>
<td align="left">WT-like</td>
<td align="left">WT-like</td>
</tr>
<tr>
<td align="left">A29T</td>
<td align="left">COSMIC</td>
<td align="left">2.2 &#xb1; 0.5</td>
<td align="left">WT-like</td>
<td align="left">Unstable but active</td>
</tr>
<tr>
<td align="left">K32N</td>
<td align="left">gnomAD</td>
<td align="left">79 &#xb1; 11</td>
<td align="left">WT-like</td>
<td align="left">WT-like</td>
</tr>
<tr>
<td align="left">G34V</td>
<td align="left">gnomAD</td>
<td align="left">54 &#xb1; 11</td>
<td align="left">Total-loss</td>
<td align="left">Stable but Inactive</td>
</tr>
<tr>
<td align="left">E36K</td>
<td align="left">gnomAD</td>
<td align="left">64 &#xb1; 3</td>
<td align="left">WT-like</td>
<td align="left">WT-like</td>
</tr>
<tr>
<td align="left">S40L</td>
<td align="left">gnomAD</td>
<td align="left">0.0 &#xb1; 0.0</td>
<td align="left">WT-like</td>
<td align="left">Total-loss</td>
</tr>
<tr>
<td align="left">D41G</td>
<td align="left">gnomAD</td>
<td align="left">14 &#xb1; 2</td>
<td align="left">Total-loss</td>
<td align="left">Stable but inactive</td>
</tr>
<tr>
<td align="left">D41Y</td>
<td align="left">COSMIC</td>
<td align="left">14 &#xb1; 2</td>
<td align="left">Stable but inactive</td>
<td align="left">Stable but inactive</td>
</tr>
<tr>
<td align="left">M45L</td>
<td align="left">COSMIC</td>
<td align="left">28 &#xb1; 5</td>
<td align="left">WT-like</td>
<td align="left">WT-like</td>
</tr>
<tr>
<td align="left">M45I</td>
<td align="left">COSMIC</td>
<td align="left">28 &#xb1; 5</td>
<td align="left">WT-like</td>
<td align="left">WT-like</td>
</tr>
<tr>
<td align="left">I51V</td>
<td align="left">gnomAD</td>
<td align="left">14 &#xb1; 1</td>
<td align="left">WT-like</td>
<td align="left">Stable but inactive</td>
</tr>
<tr>
<td align="left">W106R</td>
<td align="left">gnomAD</td>
<td align="left">10 &#xb1; 1</td>
<td align="left">Total-loss</td>
<td align="left">Total-loss</td>
</tr>
<tr>
<td align="left">W106C</td>
<td align="left">COSMIC</td>
<td align="left">10 &#xb1; 1</td>
<td align="left">Total-loss</td>
<td align="left">Total-loss</td>
</tr>
<tr>
<td align="left">F107C</td>
<td align="left">gnomAD</td>
<td align="left">7.6 &#xb1; 0.5</td>
<td align="left">Unstable but active</td>
<td align="left">Unstable but active</td>
</tr>
<tr>
<td align="left">M155I</td>
<td align="left">COSMIC</td>
<td align="left">13 &#xb1; 3</td>
<td align="left">WT-like</td>
<td align="left">WT-like</td>
</tr>
<tr>
<td align="left">H162N</td>
<td align="left">COSMIC</td>
<td align="left">6.6 &#xb1; 0.5</td>
<td align="left">WT-like</td>
<td align="left">WT-like</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>The table indicates whether the variants are found in the COSMIC/gnomAD databases as well as the solvent exposure (as % ASA) determined using a crystallographic model of WT NQO1 [PDB code 2F1O (<xref ref-type="bibr" rid="B4">Asher et al., 2006</xref>)], the software Getarea and the computational classification at variant and residue level using a combination of predictions of thermodynamic stability change upon mutation and evolutionary conservation.</p>
</fn>
<fn id="Tfn1">
<label>
<sup>a</sup>
</label>
<p>Using GetArea (<ext-link ext-link-type="uri" xlink:href="http://curie.utmb.edu/getarea.html">http://curie.utmb.edu/getarea.html</ext-link>) and the structure with PDB code 2F1O (<xref ref-type="bibr" rid="B4">Asher et al., 2006</xref>). Data are the average &#xb1;s.d. from eight monomers.</p>
</fn>
</table-wrap-foot>
</table-wrap>
</sec>
<sec sec-type="materials|methods" id="s2">
<title>2 Materials and methods</title>
<sec id="s2-1">
<title>2.1 Experimental methods</title>
<sec id="s2-1-1">
<title>2.1.1 Protein expression and purification</title>
<p>Mutations were introduced by site-directed mutagenesis in the wild-type (WT) NQO1 cDNA cloned into the pET-15b vector (pET-15b-NQO1) by GenScript (Leiden, Netherlands). Mutated codons were optimized for expression in <italic>E. coli</italic> and mutagenesis was confirmed by sequencing the entire cDNA. The plasmids were transformed in <italic>E. coli</italic> BL21 (DE3) cells (Agilent Technologies, Santa Clara, CA, United States) for protein expression.</p>
<p>To determine the amount of soluble NQO1 at 37&#xb0;C, 5&#xa0;ml of LB medium containing 0.1&#xa0;mg mL<sup>&#x2212;1</sup> ampicillin (purchased from Canvax Biotech, C&#xf3;rdoba, Spain) was inoculated with transformed cells and grown for 16&#xa0;h at 37&#xb0;C. 0.5&#xa0;ml of these cultures were diluted into 10&#xa0;ml of LB containing 0.1&#xa0;mg mL<sup>&#x2212;1</sup> ampicillin (LBA) and grown at 37&#xb0;C for 3&#xa0;h. After that, cultures were induced with 0.5&#xa0;mM of isopropyl &#x3b2;-D-1-thiogalactopyranoside (IPTG, Canvax Biotech) at 37&#xa0;&#xb0;C for 4&#xa0;h. Cells were harvested by centrifugation at 2,900&#xa0;<italic>g</italic> in a bench centrifuge at 4&#xb0;C and frozen at &#x2212;80&#xb0;C for 16&#xa0;h. Pellets were resuspended in binding buffer (20&#xa0;mM Na-phosphate, 300&#xa0;mM NaCl, 50&#xa0;mM imidazole, pH 7.4) with 1&#xa0;mM phenylmethylsulfonyl fluoride (PMSF, Sigma-Aldrich, Madrid, Spain) and sonicated in an ice bath. These <italic>total extracts</italic> were centrifugated (24,000&#xa0;<italic>g</italic>, 30&#xa0;min, 4&#xb0;C in a bench centrifuge) to obtain the <italic>soluble extracts</italic>. The amount of NQO1 in total and soluble extracts was determined by Western-blotting providing the S/T (soluble/total) ratio for each variant. Samples were denatured using Laemmli&#x2019;s buffer, resolved in polyacrylamide gel electrophoresis in the presence of sodium dodecylsulphate (SDS-PAGE, 12% acrylamide) gels and transferred to PVDF membranes (GE Healthcare, Chicago, IL, United States) using standard procedures. Immunoblotting was carried out using primary monoclonal antibody against NQO1 (sc-393736, Santa Cruz Biotechnology, Dallas, TX, United States) at 1:500 dilution and, as secondary antibody, an anti-mouse IgG&#x3ba; BP-HRP (sc-516102, Santa Cruz Biotechnology) at 1:2000 dilution was used. Samples were visualized using luminol-based enhanced chemiluminescence (from BioRad Laboratories, Hercules, CA, United States), scanned and analysed using Image Lab (from BioRad Laboratories).</p>
<p>For large-scale purifications, a preculture (100&#xa0;ml) was prepared from a single clone for each variant and grown for 16&#xa0;h at 37&#xb0;C in LBA and diluted into 2.4&#x2013;4.8&#xa0;L of LBA. After 3&#xa0;h at 37&#xb0;C, NQO1 expression was induced by the addition of 0.5&#xa0;mM IPTG for 6&#xa0;h at 25&#xb0;C. Cells were harvested by centrifugation at 8,000&#xa0;<italic>g</italic> and frozen overnight at &#x2212;80&#xa0;&#xb0;C. NQO1 proteins were purified using immobilized nickel affinity chromatography columns (IMAC, GE Healthcare) as described (<xref ref-type="bibr" rid="B2">Anoz-Carbonell et al., 2020</xref>). Isolated dimeric fractions of NQO1 variants were exchanged to HEPES-KOH buffer 50&#xa0;mM pH 7.4 using PD-10 columns (GE Healthcare). The UV&#x2013;visible spectra of purified NQO1 proteins were measured in a Cary spectrophotometer (Agilent Technologies, Waldbronn, Germany) and used to quantify NQO1 concentration and the content of FAD as described in (<xref ref-type="bibr" rid="B2">Anoz-Carbonell et al., 2020</xref>). Apo-proteins were obtained as described in (<xref ref-type="bibr" rid="B52">Vankova et al., 2019</xref>). Briefly, holo-proteins were incubated with 2&#xa0;M urea and 2&#xa0;M KBr in HEPES-KOH 50&#xa0;mM pH 7.4 in the presence of 2&#xa0;mM &#x3b2;-mercaptoethanol and 1&#xa0;mM PMSF and loaded into IMAC columns, washed with 2&#xa0;M urea and 2&#xa0;M KBr in HEPES-KOH 50&#xa0;mM pH 7.4, 2&#xa0;mM &#x3b2;-mercaptoethanol, then with HEPES-KOH 50&#xa0;mM pH 7.4, 2&#xa0;mM &#x3b2;-mercaptoethanol eluted with 20&#xa0;mM Na-Phosphate 300&#xa0;mM NaCl 500&#xa0;mM imidazole pH 7.4 and finally exchanged to HEPES-KOH 50&#xa0;mM pH 7.4. These apo-proteins contained less than 2% bound FAD based on UV-visible spectra. Samples were stored at &#x2212;80&#xb0;C upon flash freezing in liquid N<sub>2</sub>. Protein purity and integrity was checked by SDS-PAGE.</p>
</sec>
<sec id="s2-1-2">
<title>2.1.2 <italic>In vitro</italic> characterization of NQO1 variants</title>
<p>Thermal denaturation of NQO1 proteins, as holo-proteins (2&#xa0;&#x3bc;M in monomer &#x2b;100&#xa0;&#x3bc;M FAD) was monitored by following changes in tryptophan emission fluorescence in HEPES-KOH 50&#xa0;mM at pH 7.4 as described in (<xref ref-type="bibr" rid="B31">Medina-Carmona et al., 2017b</xref>). <italic>T</italic>
<sub>m</sub> values were reported as mean &#xb1; s.d. of four independent measurements.</p>
<p>Fluorescence titrations were carried out at 25&#xb0;C using 1&#xa0;cm &#xd7; 0.3&#xa0;cm path-length cuvettes in a Cary Eclipse spectrofluorimeter (Agilent Technologies, Waldbronn, Germany). Experiments were performed in 20&#xa0;mM K-phosphate, pH 7.4, essentially as described in (<xref ref-type="bibr" rid="B39">Pacheco-Garc&#xed;a et al., 2020</xref>). Briefly, apo-NQO1 (0.25&#xa0;&#xb5;M in subunit) was mixed with 0&#x2013;2&#xa0;&#x3bc;M FAD in K-phosphate 20&#xa0;mM pH 7.4. Samples were incubated at 25&#xb0;C in the dark for at least 10&#xa0;min before measurements. Spectra were acquired in the 340&#x2013;360&#xa0;nm range upon excitation at 280&#xa0;nm (slits 5&#xa0;nm), and spectra were averaged over 10 scans registered at a scan rate of 200&#xa0;nm min<sup>&#x2212;1</sup>. FAD binding fluorescence intensities at 350&#xa0;nm were fitted using a single and identical type of binding sites as described in (<xref ref-type="bibr" rid="B39">Pacheco-Garc&#xed;a et al., 2020</xref>). Variant effects on the FAD binding free energy (&#x394;&#x394;G<sub>FAD</sub>) were calculated as:<disp-formula id="e1">
<mml:math id="m1">
<mml:mrow>
<mml:mo>&#x2206;</mml:mo>
<mml:mo>&#x2206;</mml:mo>
<mml:msub>
<mml:mi>G</mml:mi>
<mml:mrow>
<mml:mi>F</mml:mi>
<mml:mi>A</mml:mi>
<mml:mi>D</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mi>R</mml:mi>
<mml:mo>&#xb7;</mml:mo>
<mml:mi>T</mml:mi>
<mml:mo>&#xb7;</mml:mo>
<mml:mi>ln</mml:mi>
<mml:mfrac>
<mml:mrow>
<mml:msub>
<mml:mi>K</mml:mi>
<mml:mrow>
<mml:mi>d</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mi>u</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mi>K</mml:mi>
<mml:mrow>
<mml:mi>d</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mi>W</mml:mi>
<mml:mi>T</mml:mi>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
<label>(1)</label>
</disp-formula>Where R is the ideal gas constant (1.987&#xa0;cal mol&#xb7;K<sup>&#x2212;1</sup>), T is the experimental temperature (298.15&#xa0;K), and <italic>K</italic>
<sub>d(mut)</sub> and <italic>K</italic>
<sub>d(WT)</sub> are the FAD binding dissociation constant of the mutant and WT protein variants, respectively. A positive value of &#x394;&#x394;G<sub>FAD</sub> indicates that the mutation reduces the affinity for FAD.</p>
<p>For proteolysis studies, NQO1 samples (10&#xa0;&#x3bc;M in monomer) were prepared in HEPES-KOH 50&#xa0;mM at pH 7.4 in the presence of 100&#xa0;&#x3bc;M FAD (NQO1<sub>holo</sub>) and incubated at 25<sup>o</sup>C for 5&#xa0;min. The proteolysis reaction was initiated upon addition of 0.02&#x2013;1.2&#xa0;&#x3bc;M thermolysin (from <italic>Geobacillus stearothermophilus</italic>, Sigma-Aldrich) and a final concentration of 10&#xa0;mM CaCl<sub>2</sub>. Samples were incubated at 25&#xb0;C and aliquots were collected over time and the reaction quenched by addition of EDTA pH 8 (final concentration of 20&#xa0;mM) and Laemmli&#xb4;s buffer (2x). Controls (time 0) were prepared likewise but without thermolysin. Samples were resolved by SDS-PAGE under reducing conditions in gels containing 12% acrylamide. Gels were stained with Coomassie blue G-250. Densitometry was carried out using ImageJ. Data were analyzed using an exponential function to provide the apparent rate constant (<italic>k</italic>
<sub>obs</sub>). From the linear dependence of <italic>k</italic>
<sub>obs</sub> vs. [thermolysin], we obtained the second-order rate constant <italic>k</italic>
<sub>prot</sub>. Linearity in these plot indicate that proteolysis occurs under a EX2 mechanism, thus reflecting the thermodynamic stability of the thermolysin cleavage site (Ser72-Val73) between non-cleavable and cleavable states (<xref ref-type="bibr" rid="B41">Park and Marqusee, 2004</xref>). These <italic>k</italic>
<sub>prot</sub> values were used to determine mutational effects on the local stability of thermolysin cleave site (&#x394;&#x394;G<sub>PROT</sub>) using <xref ref-type="disp-formula" rid="e2">Eq. 2</xref>:<disp-formula id="e2">
<mml:math id="m2">
<mml:mrow>
<mml:mo>&#x2206;</mml:mo>
<mml:mo>&#x2206;</mml:mo>
<mml:msub>
<mml:mi>G</mml:mi>
<mml:mrow>
<mml:mi>P</mml:mi>
<mml:mi>R</mml:mi>
<mml:mi>O</mml:mi>
<mml:mi>T</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mi>R</mml:mi>
<mml:mo>&#xb7;</mml:mo>
<mml:mi>T</mml:mi>
<mml:mo>&#xb7;</mml:mo>
<mml:mi mathvariant="italic">ln</mml:mi>
<mml:mfrac>
<mml:mrow>
<mml:msub>
<mml:mi>k</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>t</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mi>u</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mi>k</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>t</mml:mi>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mi>W</mml:mi>
<mml:mi>T</mml:mi>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
<label>(2)</label>
</disp-formula>Where R is the ideal gas constant (1.987&#xa0;cal mol&#xb7;K<sup>&#x2212;1</sup>), T is the experimental temperature (298.15&#xa0;K), and <italic>k</italic>
<sub>prot(mut)</sub> and <italic>k</italic>
<sub>prot(WT)</sub> are the second-order proteolysis rate constants of the mutant and WT protein variants, respectively. A positive value of &#x394;&#x394;G<sub>PROT</sub> indicates that the mutation thermodynamically destabilizes the thermolysin cleavage site.</p>
</sec>
</sec>
<sec id="s2-2">
<title>2.2 Computational analyses</title>
<sec id="s2-2-1">
<title>2.2.1 Evolutionary conservation analysis</title>
<p>We used GEMME (<xref ref-type="bibr" rid="B18">Laine et al., 2019</xref>) to evaluate evolutionary distances from the WT NQO1 sequence (Uniprot ID: P15559 &#x2014; isoform 1). We used HHblits (<xref ref-type="bibr" rid="B46">Remmert et al., 2011</xref>; <xref ref-type="bibr" rid="B51">Steinegger et al., 2019</xref>) to generate a multiple sequence alignment (MSA) using UniClust30 as sequence database and an E-value threshold of 10<sup>&#x2212;10</sup>. The resulting MSA contained 1,602 sequences and was refined using two additional filters: first, all the columns that were not present in the WT NQO1 sequence were removed; second, all the sequences with more than the 50% of gaps were removed. Application of these two filters yielded 1,414 sequences in the MSA. The GEMME package was run using default parameters. For each position, a median score was evaluated using all the available substitutions.</p>
</sec>
<sec id="s2-2-2">
<title>2.2.2 Thermodynamic stability predictions</title>
<p>Changes in thermodynamic stability (&#x394;&#x394;G) were calculated using the crystal structure (<xref ref-type="bibr" rid="B10">Faig et al., 2000</xref>) (PDB 1D4A) and the Rosetta package (GitHub SHA1 c7009b3115c22daa9efe2805d9d1ebba08426a54) with the Cartesian &#x394;&#x394;G protocol (<xref ref-type="bibr" rid="B42">Park et al., 2016</xref>; <xref ref-type="bibr" rid="B12">Frenz et al., 2020</xref>). The values obtained from Rosetta in internal Energy Unit were divided by 2.9 to bring them on to a scale corresponding to kcal&#xb7;mol<sup>&#x2212;1</sup> (<xref ref-type="bibr" rid="B42">Park et al., 2016</xref>). Median scores were evaluated for each position using all the available substitutions.</p>
<p>We used DSSP (<xref ref-type="bibr" rid="B16">Kabsch and Sander, 1983</xref>) to calculate the solvent accessible surface area (SASA) when identifying interface residues in NQO1. Interface residues were defined as those residues for a difference larger than 0.2 was detected between SASA calculations based on the dimer and monomer structure.</p>
</sec>
</sec>
</sec>
<sec sec-type="results" id="s3">
<title>3 Results</title>
<sec id="s3-1">
<title>3.1 Saturation mutagenesis by computational methods</title>
<p>We first used the predictive ability of evolutionary conservation analysis combined with thermodynamic stability calculations to classify all possible variants (i.e. saturation mutagenesis) in NQO1 based on their effects on the protein function and stability (<xref ref-type="bibr" rid="B8">Cagiada et al., 2021</xref>). For evolutionary conservation studies, we used GEMME (<xref ref-type="bibr" rid="B18">Laine et al., 2019</xref>) which provides a score (&#x394;E) for all possible single amino acid change variants of NQO1 (<xref ref-type="sec" rid="s10">Supplementary Figure S1A</xref>). &#x394;E represents the evolutionary distance of a variant from the WT NQO1 sequence, and &#x394;E has been shown to be a useful predictor of the deleterious effects on function and stability of the given substitution. We used Rosetta (<xref ref-type="bibr" rid="B42">Park et al., 2016</xref>) to predict variant effects on thermodynamic stability (&#x394;&#x394;G) using a crystal structure of NQO1 (<xref ref-type="bibr" rid="B10">Faig et al., 2000</xref>) as input (<xref ref-type="sec" rid="s10">Supplementary Figure S1B</xref>) and subsequently calculated the median &#x394;&#x394;G for all variants at each position. We performed &#x394;&#x394;G evaluations using both the monomeric and dimeric structure of NQO1 to separate effects on overall stability and effects on dimerization. Specifically, we calculated &#x394;&#x394;G from the monomer (<xref ref-type="sec" rid="s10">Supplementary Figures S1B,S2A</xref>) to predict the change in thermodynamic stability relative to wild type of each variant. We also performed similar &#x394;&#x394;G calculations using the dimer structure as input (<xref ref-type="sec" rid="s10">Supplementary Figures S1C,S2B</xref>), introducing each missense variant in both chains (i.e., treating this as a homodimer) and used the resulting values to compare with experiments. Based on these two calculations, we also evaluated the &#x394;&#x394;G of dimerization as the difference between the two Rosetta runs (<xref ref-type="sec" rid="s10">Supplementary Figures S2C,D</xref>) to highlight which residues are involved in stabilizing the dimer and thus also those variants that might weaken dimer formation. Then, we evaluated the difference in the SASA between the dimeric and monomeric residues of NQO1 (<xref ref-type="sec" rid="s10">Supplementary Figure S2C</xref>) and we classified 33 of them as interface residues. We found that for 20 of these interface residues the median &#x394;&#x394;G of dimerization was &#x3e;1&#xa0;kcal mol<sup>&#x2212;1</sup>. Of these 20, 15 were stable upon mutation in the monomeric form (median &#x394;&#x394;G &#x3c;2&#xa0;kcal mol<sup>&#x2212;1</sup>) and a subset of seven display a median &#x394;&#x394;G of dimerization &#x3e;2&#xa0;kcal mol<sup>&#x2212;1</sup>.</p>
<p>Then, we combined the evolutionary conservation scores and stability calculations based on the monomeric protein for the 5,187 variants of NQO1 and plotted the results in a two-dimensional histogram (<xref ref-type="fig" rid="F1">Figure 1A</xref>). We used cutoff values of 2&#xa0;kcal mol<sup>&#x2212;1</sup> for Rosetta &#x394;&#x394;G values and -3 for GEMME &#x394;E scores as thresholds for all the variants in order to separate them based on their effects (<xref ref-type="bibr" rid="B23">Luo et al., 2019</xref>). To ease analyses and interpretations, we associated each of the four defined regions with a color (<xref ref-type="bibr" rid="B8">Cagiada et al., 2021</xref>). &#x2018;WT-like&#x2019; variants represent 48% of the available NQO1 variants (shown in green). 20% of NQO1 substitutions show high &#x394;&#x394;G and high evolutionary distances and are classified as &#x201c;Total-loss.&#x201d; These variants have substitutions that are unlikely in the evolutionary analysis (&#x394;E &#x3c; &#x2212;3) and lead to decreased stability (&#x394;&#x394;G &#x3e;2&#xa0;kcal mol<sup>&#x2212;1</sup>); they thus likely compromise protein function <italic>via</italic> loss of protein stability (colored in red). Variants with high negative &#x394;E and low &#x394;&#x394;G belong to the &#x201c;Stable but inactive&#x201d; class (colored in blue). This class contains 24% of the variants and represent those for which the evolutionary and stability analysis suggests that the protein function has been compromised, but not for stability reasons. Lastly, the remaining 8% of the variants show low stability and low evolutionary distance, and were classified as &#x201c;Unstable but active&#x201d; (colored in yellow). Having predicted the effects of all possible missense variants, we performed a similar classification of amino acid positions, assigning the most common variant class to each position (<xref ref-type="fig" rid="F1">Figures 1C,D</xref>) and found 48% of the total positions classified as &#x201c;WT-like,&#x201d; 25% as &#x201c;-Total-loss,&#x201d; 22% as &#x201c;Stable but inactive&#x201d; and 5% as &#x201c;Unstable but active.&#x201d;</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>Saturation mutagenesis of NQO1 based on computational methods. <bold>(A)</bold> Two-dimensional histogram which combines the data from the evolutionary conservation analysis (&#x394;E, <italic>y</italic>-axis) with the thermodynamic stability (&#x394;&#x394;G, <italic>x</italic>-axis) data from Rosetta on the NQQ1 monomer. The variants are categorized in one of the four regions, which are delimited by dashed lines. The fraction of variants, class and colour assigned to each region are indicated. The four classes of variants/positions are reported at the bottom of the figure: &#x201c;WT-like&#x201d; (Green), &#x201c;Low stability, active&#x201d; (yellow), &#x201c;Stable but inactive&#x201d; (blue) and &#x201c;Total-loss&#x201d; (red). <bold>(B)</bold> The scores of gnomAD (grey) and COSMIC (orange) variants in the 2D histogram. <bold>(C)</bold> The positional colour categories assigned using the most common colour of the position in the sequence together with the secondary structure. <bold>(D)</bold> The positional classification mapped to the protein crystal structure (PDB: 1D4A) (<xref ref-type="bibr" rid="B10">Faig et al., 2000</xref>).</p>
</caption>
<graphic xlink:href="fmolb-09-1063620-g001.tif"/>
</fig>
<p>In addition, we used the data from the dimer analysis to evaluate the number of residues involved in the stabilization of the dimer form. We found that 14 residues at the interface changed their classification to &#x201c;Total-loss&#x201d; if &#x394;&#x394;G was evaluated using the dimer structure. Of these 14, 9 were classified as &#x201c;Stable but inactive,&#x201d; while 5 were classified as WT-like using monomeric &#x394;&#x394;G data. Thus, many residues at the interface appear to be conserved during evolution to preserve the stability of the dimeric form of NQO1.</p>
<p>Having analyzed all possible missense variants, we next looked at the results for a subset of variants that have been found in the human population. Specifically, we looked at variants that are found in the COSMIC (COSMIC v.92; <ext-link ext-link-type="uri" xlink:href="https://cancer.sanger.ac.uk/cosmic">https://cancer.sanger.ac.uk/cosmic</ext-link>) or gnomAD (gnomAD v.2.1.1; <ext-link ext-link-type="uri" xlink:href="https://gnomad.broadinstitute.org/">https://gnomad.broadinstitute.org/</ext-link>) databases, and did not find clear differences between these two sets (<xref ref-type="fig" rid="F1">Figure 1B</xref>). In particular, we found variants in both sets that would be predicted as functional and others for which stability and/or conservation analyses predict loss-of-function (LoF). This result is in line with the notion that both databases may contain both potentially pathogenic as well as benign variants.</p>
</sec>
<sec id="s3-2">
<title>3.2 Selection of NQO1 variants to be experimentally characterized</title>
<p>After studying the NQO1 variants computationally, we next examined a set of the variants using a series of different experiments. In this study, we have thus extended our previous work on 8 naturally-occurring variants in NQO1 (<xref ref-type="bibr" rid="B39">Pacheco-Garc&#xed;a et al., 2020</xref>) to a set of 22 variants (<xref ref-type="table" rid="T1">Table 1</xref>; <xref ref-type="fig" rid="F2">Figure 2</xref>). Overall, this set included thirteen variants found in the gnomAD database and nine variants found in the COSMIC database. Seventeen of these variants clustered in the N-terminal part of the protein (residues 1&#x2013;51), whereas five were located in the segment comprising residues 106&#x2013;162 (in close proximity to the active site). Nine variants affected residues buried inside the protein structure (with less than 10% of SASA), whereas the rest are at positions that are partially or highly solvent-exposed (<xref ref-type="table" rid="T1">Table 1</xref>). The chemical nature of the changes introduced by the substitutions is also quite diverse, and the substitutions are located in different elements of secondary structure (<xref ref-type="fig" rid="F2">Figure 2B</xref>). Based on our computational analysis the 22 variants represent well the heterogeneous scale of effects on NQO1 function and stability. Indeed, of the 22 variants selected 14 are classified by the computational models as &#x201c;WT-like,&#x201d; 4 as &#x201c;Total-loss&#x201d; and 4 as &#x201c;stable but inactive.&#x201d;</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>Structural features and local stability of the substituted residues and the variants characterized experimentally in this work. <bold>(A)</bold> The residues mutated were mapped onto the structure of NQO1 (PDB code 2F1O) (<xref ref-type="bibr" rid="B4">Asher et al., 2006</xref>). Residues are depicted as spheres, and the colour code indicates substitutions located in the 1&#x2013;51 region (orange) or the active site (red). Variants were labelled in red (from COSMIC) or in green (from gnomAD). FAD and Dic are shown as dot representations in cyan and blue, respectively. <bold>(B)</bold> Location of substitutions in the sequence of NQO1 regarding secondary structure elements (from (<xref ref-type="bibr" rid="B10">Faig et al., 2000</xref>)). Substitutions were labelled in red (from COSMIC) or in green (from gnomAD). <bold>(C)</bold> HDX of segments containing the 22 variants experimentally investigated in this work. The segments are labelled in blue. The colour code corresponds to HDX for NQO1<sub>apo</sub>, NQO1<sub>holo</sub> and NQO1<sub>dic</sub> states. HDX data are from (<xref ref-type="bibr" rid="B52">Vankova et al., 2019</xref>).</p>
</caption>
<graphic xlink:href="fmolb-09-1063620-g002.tif"/>
</fig>
<p>Results from a recent hydrogen/deuterium exchange (HDX) study on WT NQO1 (<xref ref-type="bibr" rid="B52">Vankova et al., 2019</xref>) enables us to evaluate the local stability of the protein segments in which these residues are found as well as the effect of FAD and dicoumarol binding (two ligands of functional and stability relevance) (<xref ref-type="fig" rid="F2">Figure 2C</xref>). The L7P, L7R and V9I substitutions are located in regions with high stability that do not change upon binding of FAD or dicoumarol (Dic; a competitive inhibitor of NADH). Variants G3S, G3D, A29T, K32N, G34V, E36K, S40L and H162N are located in regions with intermediate HDX stability and whose local stability is hardly sensitive to ligand binding. Nevertheless, these positions could still, in principle, affect protein folding, stability, or solubility and indirectly affect the binding of the substrates. M45L and M45I are found in a region with low stability and not responsive to ligand binding. Y20N is located in a region with intermediate stability and where HDX shows a response to ligand binding; the remaining six variants (T16M, I51V, W106R, W106C, F107C and M155I) are in regions with low stability and also their local stability respond directly to ligand binding. This last group of variants may thus have a greater potential to affect enzymatic activity [preventing either the formation of the &#x201c;stable&#x201d; holo-protein, a precatalytic state, or the formation of a catalytically relevant state, the Dic state, with FAD and the inhibitor Dic bound (<xref ref-type="bibr" rid="B2">Anoz-Carbonell et al., 2020</xref>)]. Although this suggestion is simple, it must be noted that regions of either high or low local stability may play roles in enzyme functional and allosteric response, and that local effects can propagate far from the perturbed site (due to ligand binding or amino acid substitutions) (<xref ref-type="bibr" rid="B24">Luque and Freire, 2000</xref>; <xref ref-type="bibr" rid="B25">Luque et al., 2002</xref>; <xref ref-type="bibr" rid="B35">Naganathan, 2019</xref>). Therefore, we next performed an experimental characterization of variant effects on protein stability and function and compared the results with our computational analyses.</p>
</sec>
<sec id="s3-3">
<title>3.3 Variant effects on the expression levels, solubility and stability of NQO1</title>
<p>We first experimentally analysed the effect of these 22 NQO1 variants on the expression levels and solubility of the protein (upon expression in <italic>E.coli</italic>) as well as their effects on thermal stability (<xref ref-type="sec" rid="s10">Supplementary Table S1</xref>; <xref ref-type="fig" rid="F3">Figures 3</xref>, <xref ref-type="fig" rid="F4">4</xref>).</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>Overall effects of gnomAD and COSMIC variations on the solubility/aggregation propensity and thermal stability of the NQO1 protein. <bold>(A&#x2013;C)</bold> Expression analyses of solubility/aggregation propensity of NQO1 variants in <italic>E.coli</italic> at 37<sup>o</sup>C. The total amount of NQO1 protein [T, <bold>(A)]</bold> as well as the ratio of soluble/total (S/T) protein <bold>(B)</bold> were determined from induced cells sonicated before (T) and after (S) centrifugation at 21,000&#xa0;<italic>g</italic>. The levels of NQO1 protein were determined by western-blotting (<xref ref-type="sec" rid="s10">Supplementary Figure S3</xref>). The amount of soluble protein (S) is calculated as the product of T and S/T and shown in <bold>(C)</bold>. Data are the mean &#xb1; s.d. from at least three independent expression experiments for each variant; <bold>(D)</bold> Thermal stability of NQO1 variants as holo-proteins. &#x394;<italic>T</italic>
<sub>m</sub> values correspond to the difference between a given variant and the WT protein. Data are the mean &#xb1; s.d. from three-six technical replicas. Small circles indicate the effects of individual variants and large circles (and corresponding errors) are those for each data set (mean &#xb1; s.d.). For reference, the values corresponding to WT NQO1 are shown in light grey. Variants are grouped in the gnomAD and COSMIC sets.</p>
</caption>
<graphic xlink:href="fmolb-09-1063620-g003.tif"/>
</fig>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>Variant effects on thermal stability related to their location near the MMI or the bound FAD. <bold>(A)</bold> Experimental &#x394;<italic>T</italic>
<sub>m</sub> values for individual variants; <bold>(B&#x2013;D)</bold> Structural location of the FAD (black spheres) and the MMI (grey dots) <bold>(B)</bold> and mutated residues (colour scale according to their destabilizing effect) <bold>(C)</bold>. <bold>(D)</bold> shows an overlay of <bold>(B,C)</bold>. Note that two views rotated 90&#xb0; are shown. The structural model used for display was PDB code 2F1O (<xref ref-type="bibr" rid="B4">Asher et al., 2006</xref>). The residue W106 is highlighted in magenta due to the widely different effects of the W106R/W106C substitutions.</p>
</caption>
<graphic xlink:href="fmolb-09-1063620-g004.tif"/>
</fig>
<p>The analysis of the total (T) expression of the variants vs. WT NQO1 at 37&#xb0;C (<xref ref-type="fig" rid="F3">Figures 3A,B</xref>; <xref ref-type="sec" rid="s10">Supplementary Figure S3</xref>; <xref ref-type="sec" rid="s10">Supplementary Table S1</xref>) revealed that some variants (G3S, G3D, L7P, and V9I) showed higher total expression levels, in agreement with our previous report (<xref ref-type="bibr" rid="B39">Pacheco-Garc&#xed;a et al., 2020</xref>). This is likely the result of codon optimization used in the mutagenesis. Most of the variants showed relatively high expression levels, ranging from 25% to full WT levels, indicating that these variants mildly to moderately reduced total expression levels. The L7R, G34V, S40L, D41G, and D41Y variants showed extremely low expression levels, thus preventing further biophysical characterization. Interestingly, overall, no substantial differences were observed between the average effect of the gnomAD and COSMIC sets of variants.</p>
<p>We then determined the fraction of NQO1 existing as soluble protein (S/T ratios; <xref ref-type="fig" rid="F3">Figure 3B</xref>; <xref ref-type="sec" rid="s10">Supplementary Table S1</xref>). WT NQO1 showed a ratio of &#x223c;0.9 (<xref ref-type="sec" rid="s10">Supplementary Table S1</xref>; <xref ref-type="fig" rid="F3">Figure 3B</xref>). Again, although some variants showed much lower S/T ratios than WT NQO1, most of them showed values between 0.2 and the WT ratio. Only five variants showed lower S/T ratios than 0.15 (L7P, L7R, S40L, F107C and M155I). Expression under milder conditions (25&#xb0;C) did not allow for purification of enough protein of the L7P, L7R, S40L, and G34V variants for further biophysical characterization.</p>
<p>We used the product of total expression levels and S/T ratios (i.e. the S values) as a proxy to evaluate the overall effect of amino acid substitutions on NQO1 solubility/aggregation propensity when expressed at 37&#xb0;C (<xref ref-type="sec" rid="s10">Supplementary Table S1</xref>; <xref ref-type="fig" rid="F3">Figure 3C</xref>). Nine substitutions reduced the solubility below 20% of the WT protein (L7R, G34V, S40L, D41G, D41Y, M45I, W106R, F107C, and M155I).</p>
<p>Next, we determined the thermal stability of the remaining eighteen variants as holo-proteins (i.e. those that were expressed well as soluble proteins and were stable during purification) (<xref ref-type="fig" rid="F3">Figures 3D</xref>, <xref ref-type="fig" rid="F4">4</xref>, <xref ref-type="sec" rid="s10">Supplementary Table S1</xref>). Nine variants showed a thermal stability close that of the WT protein (&#x394;<italic>T</italic>
<sub>m</sub> &#x2264; 2&#xb0;C; variants G3S, G3D, V9I, A29T, K32N, E36K, F107C, M155I, and H162N), whereas five variants decreased thermal stability by 2&#x2013;5&#xb0;C (variants T16M, M45L, M45I, I51V, and W106C) and four decreased the stability by 5&#x2013;10&#xb0;C (Y20N, D41G, D41Y, and W106R) (<xref ref-type="sec" rid="s10">Supplementary Table S1</xref>). Most of the variants that destabilized the holo-protein by more than 2&#xb0;C are found in the MMI or close to the FAD bound (<xref ref-type="fig" rid="F4">Figure 4</xref>). Here, we note that the reported <italic>T</italic>
<sub>m</sub> and &#x394;<italic>T</italic>
<sub>m</sub> values are &#x201c;apparent&#x201d; values that cannot be regarded as reporting effects on thermodynamic stability since thermal unfolding is irreversible and kinetically-controlled (<xref ref-type="bibr" rid="B44">Pey et al., 2004</xref>). The W106R and W106C variants show different effects, highlighting the importance of both the location and the chemical nature of the change. The effects of the two mutations at W106 were intriguing. Both substitutions are non-conservative changes at a residue in the active site with low solvent exposure and a low structural stability with strong ligand-dependent responsiveness based on HDX studies (<xref ref-type="bibr" rid="B52">Vankova et al., 2019</xref>). However, their effects are very different, with W106R causing a much larger decrease in stability than W106C.</p>
<p>To end this section, the observed effects pinpoint that some variants in both the COSMIC and gnomAD databases decrease solubility and thermal stability of NQO1, and overall the two groups do so to similar extents (<xref ref-type="fig" rid="F3">Figure 3</xref>); this observation was also seen in the computational predictions (<xref ref-type="fig" rid="F1">Figure 1</xref>).</p>
</sec>
<sec id="s3-4">
<title>3.4 FAD binding and the stability of the FAD binding site</title>
<p>Sixteen out of the eighteen variants that yielded good levels of soluble proteins were prepared as apo-proteins to determine their affinity for FAD by titrations monitored by tryptophan fluorescence (<xref ref-type="fig" rid="F5">Figures 5A</xref>, <xref ref-type="fig" rid="F6">6</xref>; <xref ref-type="sec" rid="s10">Supplementary Figure S4</xref>; <xref ref-type="sec" rid="s10">Supplementary Table S2</xref>). The D41Y and D41G variants were too unstable to obtain apo-proteins in sufficient amounts and quality.</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>Overall effects of gnomAD and COSMIC mutations on the FAD binding affinity and the local stability of the FAD binding site (FBS). <bold>(A)</bold> Changes in apparent FAD binding free energies (&#x394;&#x394;G<sub>FAD</sub>) calculated from the difference of binding affinity between WT and a given variant from titrations. Errors are those from linear propagation; <bold>(B)</bold> Local stability of the TCS (next to the FBS) from proteolysis kinetics. Changes in local stability (&#x394;&#x394;G<sub>PROT</sub>) calculated from the difference of the second-order rate constant between WT and a given variant. Errors are those from linear propagation; For reference, the values corresponding to WT NQO1 are shown in light grey. Variants are grouped in the gnomAD and COSMIC sets.</p>
</caption>
<graphic xlink:href="fmolb-09-1063620-g005.tif"/>
</fig>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption>
<p>Variant effects on the FAD binding affinity. <bold>(A)</bold> FAD binding affinity of each variant was determined by titrations of apo-proteins. At least two independent experiments were carried out for each variant and fitted using a single-type-of-independent binding sites to obtain <italic>K</italic>
<sub>d</sub> values (note the logarithmic scale of the <italic>y</italic>-axis). Errors are those fittings. These <italic>K</italic>
<sub>d</sub> values were used to calculate the binding free energy difference (&#x394;&#x394;G<sub>FAD</sub>) between a given variant and the WT protein (note that a positive value indicates lower affinity). <bold>(B&#x2013;D)</bold> Structural location of the FAD (black spheres) and the FBS (grey dots) <bold>(B)</bold> and mutated residues (colour scale according to their destabilizing effect on FAD binding) <bold>(C)</bold>. The residue W106 is highlighted in magenta due to the widely different effects of the W106R/W106C substitutions. <bold>(D)</bold> shows an overlay of <bold>(B,C)</bold>. Note that two views rotated 90&#xb0; are shown. The structural model used for display was PDB code 2F1O (<xref ref-type="bibr" rid="B4">Asher et al., 2006</xref>).</p>
</caption>
<graphic xlink:href="fmolb-09-1063620-g006.tif"/>
</fig>
<p>The G3S, G3D, V9I, K32N, E36K, M45L, M45I, W106C, and F107C variants showed less than a 0.5&#xa0;kcal mol<sup>&#x2212;1</sup> increase in FAD binding free energy (corresponding to less than a 2.5-fold increase in <italic>K</italic>
<sub>d</sub>). The Y20N and A29T variants showed a moderate decrease in binding affinity (between 3 and 5-fold higher <italic>K</italic>
<sub>d</sub>; thus, a change in FAD binding free energy of 0.5&#x2013;1.0&#xa0;kcal mol<sup>&#x2212;1</sup>). Five variants (T16M, I51V, W106R, M155I and H162N) markedly decreased the binding affinity for FAD (10&#x2013;500-fold increase in <italic>K</italic>
<sub>d</sub>; between 1 and 3.7&#xa0;kcal mol<sup>&#x2212;1</sup> decrease in binding free energy). Inspection of a structural model of NQO1 allows us to rationalize the effect of these substitutions due to their proximity to the bound FAD, with some exceptions. For instance, the W106R, W106C and F107C substitutions are in proximity to the FAD molecule, but have widely different effects (from ca. 500-fold lower affinity in W106R, to WT-like affinity for W106C and even <italic>higher</italic> affinity than WT for F107C). These results show that NQO1 responds to natural variations very differently even at the same site (i.e. two highly non-conservative variants at the site W106).</p>
<p>Mutational effects on FAD binding affinity (&#x394;&#x394;G<sub>FAD</sub>) and proteolysis rates (&#x394;&#x394;G<sub>PROT</sub>) with thermolysin have previously been shown to correlate well (<xref ref-type="bibr" rid="B32">Medina-Carmona et al., 2017a</xref>; <xref ref-type="bibr" rid="B34">Medina-Carmona et al., 2019b</xref>; <xref ref-type="bibr" rid="B39">Pacheco-Garc&#xed;a et al., 2020</xref>). The site for initial cleavage by thermolysin (TCS) is generally between Ser72&#x2013;Val73, close to the FAD binding site (<xref ref-type="bibr" rid="B33">Medina-Carmona et al., 2016</xref>). All the variants investigated showed proteolysis patterns that were similar to that of WT NQO1 (<xref ref-type="sec" rid="s10">Supplementary Figure S5</xref>). The previously observed correlation between &#x394;&#x394;G<sub>FAD</sub> and &#x394;&#x394;G<sub>PROT</sub> holds for the 16 variants for which both FAD binding affinity and protease sensitivity can be compared (<xref ref-type="sec" rid="s10">Supplementary Figure S6</xref>). The T16M, I51V, W106C, and M155I mutations destabilized locally the TCS by 1&#x2013;2.5&#xa0;kcal mol<sup>&#x2212;1</sup> and the residues affected by these substitutions are in general close to the TCS (with the exception of M155I, the most destabilizing mutation) (<xref ref-type="fig" rid="F7">Figure 7</xref>). Again, the results for the W106R/C variants were very different: both affected the local stability by &#x223c; 1&#xa0;kcal mol<sup>&#x2212;1</sup>, but with opposite signs (<xref ref-type="sec" rid="s10">Supplementary Table S2</xref>).</p>
<fig id="F7" position="float">
<label>FIGURE 7</label>
<caption>
<p>Variant effects on the local stability of the FBS from proteolysis. <bold>(A)</bold> Second-order rate constants for proteolysis of NQO1 variants (<xref ref-type="sec" rid="s10">Supplementary Figure S5C</xref>). Errors are those fittings. These <italic>k</italic>
<sub>PROT</sub> values were used to calculate the TCS local energy free difference (&#x394;&#x394;G<sub>PROT</sub>) between a given variant and the WT protein (note that a positive value indicates lower affinity). <bold>(B,C)</bold> Structural location of the FAD (black spheres) and the TCS (blue spheres) <bold>(B)</bold>. In <bold>(C)</bold>, mutated residues (colour scale according to their destabilizing effect on FAD binding) <bold>(C)</bold> are overlayed with TCS and FAD. The residues D41 and W106 are highlighted in magenta due to the widely different effects of the D41G/D41Y and W106R/W106C substitutions. Note that two views rotated 90&#xb0; are shown. The structural model used for display was PDB code 2F1O (<xref ref-type="bibr" rid="B4">Asher et al., 2006</xref>).</p>
</caption>
<graphic xlink:href="fmolb-09-1063620-g007.tif"/>
</fig>
<p>Overall, the negative impact on FAD binding affinity and the stability of the FAD binding site in the holo-state was similar between variants from COSMIC and gnomAD sets (<xref ref-type="fig" rid="F5">Figure 5</xref>).</p>
</sec>
<sec id="s3-5">
<title>3.5 Comparison of experimental analyses and computational predictions</title>
<p>We then proceeded to compare the experimental data to each other and to computational predictions. To ease comparison between the calculated &#x394;&#x394;G values and thermal melting measurements, we first estimated &#x394;&#x394;G<sub>melting</sub> from the &#x394;<italic>T</italic>
<sub>m</sub> values using an empirical relationship (<xref ref-type="bibr" rid="B53">Watson et al., 2018</xref>), again noting that these are not strictly experimental thermodynamic values as unfolding is not reversible either by temperature (<xref ref-type="bibr" rid="B44">Pey et al., 2004</xref>) or chemical denaturants (<xref ref-type="fig" rid="F7">Figure S7</xref>). We first compared the experimental values of &#x394;&#x394;G<sub>melting</sub> to the levels of soluble protein (S values, <xref ref-type="fig" rid="F8">Figure 8A</xref>). We found that unstable variants (those with &#x394;&#x394;G<sub>melting</sub> &#x3e; 2&#xa0;kcal mol<sup>&#x2212;1</sup> or not amenable for purification, not-determined or ND) mostly showed level of S close to zero (&#x3c;5) except for L7P. Stable variants (here defined as &#x394;&#x394;G<sub>melting</sub> &#x3c; 2&#xa0;kcal mol<sup>&#x2212;1</sup>) instead showed a wide range of S values (76 &#xb1; 85%; mean &#xb1; s.d.).</p>
<fig id="F8" position="float">
<label>FIGURE 8</label>
<caption>
<p>Comparison of experimental results with computational scores. <bold>(A)</bold> Scatter plot of &#x394;&#x394;G<sub>melting</sub> (<italic>x</italic>-axis) and S values (expression &#x2a; solubility). Not-determined variants (ND) in thermal stability experiment are reported in a separate plot. <bold>(B,C)</bold> show a comparison between &#x394;&#x394;G<sub>melting</sub> and computational predictors. <bold>(D)</bold> Correlation between &#x394;&#x394;G<sub>melting</sub> and &#x394;&#x394;G<sub>FAD</sub> for NQO1 variants detected in both the experiments. <bold>(E,F)</bold> Comparison of &#x394;&#x394;G<sub>FAD</sub> with the computational results. Red lines, if present, show the boundary of experimental and computational classes for each comparison. In each panel errors are reported as a black bar on every single variant, if present.</p>
</caption>
<graphic xlink:href="fmolb-09-1063620-g008.tif"/>
</fig>
<p>We next compared &#x394;&#x394;G<sub>melting</sub> with the computational scores (<xref ref-type="fig" rid="F8">Figures 8B,C</xref>). Overall, we found a good agreement for most of the unstable and Not-Determined (ND) variants, which showed &#x394;&#x394;G &#x3e;2.0&#xa0;kcal mol<sup>&#x2212;1</sup> and evolutionary distance, &#x394;E &#x3c; &#x2212;3 indicating predicted loss of stability and function. The only exception was D41Y which displayed a stabilizing behaviour in Rosetta &#x394;&#x394;G predictions. Experimentally stable variants (&#x394;&#x394;G<sub>melting</sub> &#x3c; 2&#xa0;kcal mol<sup>&#x2212;1</sup>) displayed low evolutionary distances (&#x394;E &#x3e; &#x2212;2.5&#xa0;kcal mol<sup>&#x2212;1</sup>) except for W106C and T16M. This observation for T16M supports the notion that detrimental effects on protein function may not be connected to thermodynamic destabilization for this variant (<xref ref-type="bibr" rid="B39">Pacheco-Garc&#xed;a et al., 2020</xref>).</p>
<p>We then compared &#x394;&#x394;G<sub>FAD</sub> with the other experimental and computational observables (<xref ref-type="fig" rid="F8">Figures 8D&#x2013;F</xref>). For most (15 out of 16) of the variants where &#x394;&#x394;G<sub>FAD</sub> could be measured, the &#x394;&#x394;G<sub>melting</sub> was &#x3c;2&#xa0;kcal mol<sup>&#x2212;1</sup>, indicating stable variants which was also confirmed by Rosetta &#x394;&#x394;G calculations (13 out of 16 substitutions). Seven of the fifteen variants showed a &#x394;&#x394;G<sub>FAD</sub> &#x3e; 0.5&#xa0;kcal mol<sup>&#x2212;1</sup> indicating loss of function. Of these, three variants were captured by evolutionary conservation analysis (&#x394;E &#x3c; &#x2212;2.5&#xa0;kcal mol<sup>&#x2212;1</sup>).</p>
<p>To summarize, for 14 out of 22 tested variants (G3S L7P L7D V9I T16M Y20N K32N G34V E36K D41G M45L M45I W106R, M155I) the predictions from the computational protocols match the experimental results, in terms of variant effects on protein stability and function.</p>
<p>While the results are overall encouraging, there remains differences between computation and experiments for the effects of some mutations (eight out of twenty-two; G3D, A29T, S40L, D41Y, I51V, W106C, F107C, and H162N). For five of these (G3D, S40L, D41Y, W106C, and F107C) it appears that there is a difference between the stability prediction by Rosetta and experiments (noting again that the latter are not equilibrium measurements). For the partially exposed S40L and D41Y the reason for the discrepancy is perhaps related to specific interactions made by these two residues whose effects are not captured by the Rosetta calculations. Both W106C and F107C involve substituting aromatic residues with a cysteine, suggesting problems with evaluating such substitutions. In other two cases (G3D, A29T, and H162N) the GEMME scores did not capture properly the variant effects, possibly because some specific interactions in human NQO1 may not be present in other homologs of NQO1 and thus, not captured by the evolutionary analysis. Lastly, for I51V the behaviour is opposite from both computational predictions.</p>
</sec>
</sec>
<sec sec-type="discussion" id="s4">
<title>4 Discussion</title>
<p>With advances in sequencing technologies, we are uncovering the large genetic variability in the <italic>human genome</italic>. To exploit the availability of this information at the clinical level, we must be able to establish genotype-phenotype correlations accurately and at a large-scale. Although detailed characterization of mutational effects is obviously useful, it is difficult to perform this at such scale (many genes, many variants). However, we may use experimental characterization on a more modest scale to test the performance of current predictive tools in the hope that we can improve them. In this work, we have carried out such an exercise for the human NQO1 protein. The rationale for selecting this system is three-fold: 1) human NQO1 is a multifunctional protein and mutational effects may affect these functions through complex mechanisms (<xref ref-type="bibr" rid="B37">Pacheco-Garcia et al., 2022a</xref>; <xref ref-type="bibr" rid="B40">Pacheco-Garcia et al., 2022b</xref>). Therefore, contrasting experimental characterization and computational predictions can be challenging for current predictive tools and may help to improve them; 2) Altered NQO1 functionality is associated with increased risk of developing cancer and neurological disorders (<xref ref-type="bibr" rid="B48">Salido et al., 2022</xref>). Indeed, the presence of a highly deleterious polymorphic variant in NQO1 is associated with increased cancer risk and affects multiple protein functions through allosteric effects (<xref ref-type="bibr" rid="B19">Lajin and Alachkar, 2013</xref>; <xref ref-type="bibr" rid="B40">Pacheco-Garcia et al., 2022b</xref>); 3) Over a hundred of missense variants in human NQO1 have been found in human population (i.e. the gnomAD database) or in cancer cell lines as somatic mutations (i.e. the COSMIC database). However, the impact of these mutations on NQO1 multifunctionality and their potential role in cancer development are largely unexplored.</p>
<p>Theoretical advances and new methodologies in the fields of sequence evolution and structure predictions allow us to perform large-scale <italic>in silico</italic> mutagenesis studies on target proteins. Although the current state-of-art algorithms are often [but not always (<xref ref-type="bibr" rid="B11">Frazer et al., 2021</xref>)] less accurate at predicting pathogenicity compared to detailed experimental testing, they provide a fast and effective way to predict LoF and sometimes to generate mechanistic hypotheses regarding which properties a variant might affect (<xref ref-type="bibr" rid="B50">Stein et al., 2019</xref>; <xref ref-type="bibr" rid="B8">Cagiada et al., 2021</xref>).</p>
<p>Here, we first performed <italic>in silico</italic> saturation mutagenesis of WT NQO1, predicting the changes in thermodynamic stability (&#x394;&#x394;G) and evolutionary conservation (&#x394;E) for 5,187 variants. We combined the two scores to perform a global analysis on how the NQO1 function may be perturbed. Approximately 44% of variants are predicted to cause LoF, with 45% of these drastically affecting the protein stability. This analysis enabled us to obtain an overview on the possible biologically relevant positions and variants. Indeed, although we know that the ability of computational tools to assign biological functions and predict overall pathogenicity is rapidly increasing, we are still at a point where computational methods may not predict LoF perfectly, and often do not shed much light on the mechanisms of action. This might in particular hold for proteins like NQO1 where multiple biological functions are present, and where some of which may differ between orthologues.</p>
<p>We then used the information provided from the <italic>in silico</italic> saturation mutagenesis to select 22 naturally-occurring variants with a diverse range of predicted effects on protein stability and function to be experimentally tested. We selected nine mutations found in COSMIC and thirteen from gnomAD. Of these variants, 36% severely affected protein foldability and solubility (upon expression in <italic>E.coli</italic>) or reduced conformational stability (at least a 5&#xb0;C decrease in <italic>T</italic>
<sub>m</sub>). A quarter of the variants had severely affected FAD binding (a 5-fold decrease in affinity, i.e. a 1&#xa0;kcal mol<sup>&#x2212;1</sup> of binding free energy penalization). For 64% of the variants, experimental characterization and computational predictions agreed in the variant effects on protein stability and function, whereas the remaining 36% of the mutations might be explained by limitations known for the tools used in the prediction process. Although, at this point, this level of agreement is reasonable, it also pinpoints the necessity of improving these predictive tools.</p>
<p>COSMIC mutations are in general somatic (actually, 86% of the COSMIC mutations of NQO1 are labelled as <italic>confirmed</italic> in this database; accessed by 17 August 2022) and likely come from samples that underwent many mutational events in different genes. Thus, the identification of a mutation in the COSMIC database does not imply that this mutation is a driver mutation [here we may define a driver mutation as a mutation with the ability to drive tumorigenesis and confer selective advantages in a tumor cell and a somatic tissue (<xref ref-type="bibr" rid="B26">Mart&#xed;nez-Jim&#xe9;nez et al., 2020</xref>)]. Mutations in the gnomAD database belong to heterogeneous groups (many different sequencing projects, some of them case-control studies), and likely reflect genetic variability in the <italic>germline</italic> and in general presence or absence in gnomAD is not sufficient to assign a label as pathogenic or benign. When we examine the NQO1 variants investigated in this work found in the gnomAD database (v.2.1), allele frequencies are overall comparable in <italic>control</italic> vs. <italic>all</italic> samples (<xref ref-type="sec" rid="s10">Supplementary Table S3</xref>). This suggests that there is no strong bias towards <italic>case</italic> samples, and thus the allele frequencies in gnomAD may represent well their presence in a <italic>healthy</italic> population. The presence of these mutations in the germline may predispose somatic cells towards a new mutational event in the WT allele [as occurs in familial cancer cases (<xref ref-type="bibr" rid="B26">Mart&#xed;nez-Jim&#xe9;nez et al., 2020</xref>)], thus largely decreasing the NQO1 activity and function.</p>
<p>Our combined experimental and computational analyses provide information on the potential LoF character and the mechanisms by which the variants may exert their effects (protein stability and/or function). Due to its role in the antioxidant defense and stabilization of oncosuppressor proteins, it is likely that NQO1 play a role in cancer development. Homozygous NQO1 knock-out mice revealed cancer-associated phenotypic traits when exposed to chemical or radiological insults (<xref ref-type="bibr" rid="B45">Radjendirane et al., 1998</xref>; <xref ref-type="bibr" rid="B22">Long et al., 2000</xref>; <xref ref-type="bibr" rid="B15">Iskander et al., 2005</xref>; <xref ref-type="bibr" rid="B14">Iskander et al., 2008</xref>). Thus, the presence of LoF variants in NQO1 and increased cancer risk may resemble a recessive inheritance (<xref ref-type="bibr" rid="B19">Lajin and Alachkar, 2013</xref>). The p.P187S polymorphism (with an allele frequency of &#x223c;0.25, <xref ref-type="sec" rid="s10">Supplementary Table S3</xref>) dramatically decreases the intracellular stability of NQO1 thus preventing its interaction with oncosuppressors, reducing enzyme activity and affecting almost the entire structure of NQO1 (<xref ref-type="bibr" rid="B38">Pacheco-Garcia et al., 2021</xref>). Noteworthy, it only associates with cancer in homozygotes (<xref ref-type="bibr" rid="B19">Lajin and Alachkar, 2013</xref>). Due to the low frequency of most gnomAD NQO1 variants, their presence would be rare even in compound heterozygotes. In fact, 98% of the homozygous samples containing NQO1 missense variations correspond to homozygotes for P187S. However, an additional (<italic>somatic</italic>) mutational event in a WT/P187S genetic background (about 25% of human population) may substantially enhance the LOF phenotype in this common genetic background.</p>
<p>To conclude, we present a test of predictive tools against the experimental characterization of large set of naturally-occurring mutations on NQO1 stability and function. Further steps will be taken to provide a wider perspective on the multifunctionality of NQO1 (i.e. intracellular degradation and stability, high-resolution structural stability in different ligation states, enzyme function and cooperativity, interaction with protein partners, allosteric communication of mutational effects) and the relationships between the genetic diversity of NQO1 in human population and its link with individual propensity towards disease development.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="s5">
<title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article/<xref ref-type="sec" rid="s10">Supplementary Material</xref>, further inquiries can be directed to the corresponding author.</p>
</sec>
<sec id="s6">
<title>Author contributions</title>
<p>AP conceived the project and supervised the experimental work; JP-G and KT-M carried out expression, purification and characterization of proteins; MC carried out computational analysis; ES contributed to selection of variants and contributed with reagents; KL-L supervised the computational work; KL-L and AP received funding; M.C, KL-L and AP wrote the original draft; All authors contributed to and approved the final version of the manuscript.</p>
</sec>
<sec id="s7">
<title>Funding</title>
<p>This work was supported by the ERDF/Spanish Ministry of Science, Innovation and Universities&#x2014;State Research Agency (Grant Number. RTI 2018-096246-B-I00), Consejer&#xed;a de Econom&#xed;a, Conocimiento, Empresas y Universidad, Junta de Andaluc&#xed;a (Grant Number. P18-RT-2413), ERDF/Counseling of Economic transformation, Industry, Knowledge and Universities (Grant B-BIO-84-UGR20) and Comunidad Valenciana (Grant Number. CIAICO/2021/135). This work is a contribution from the PRISM (Protein Interactions and Stability in Medicine and Genomics) centre funded by the Novo Nordisk Foundation (to KL-L; NNF18OC0033950).</p>
</sec>
<ack>
<p>MC and KL-L acknowledge access to computational resources the Biocomputing Core Facility at the Department of Biology, University of Copenhagen.</p>
</ack>
<sec sec-type="COI-statement" id="s8">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s9">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s10">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fmolb.2022.1063620/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fmolb.2022.1063620/full&#x23;supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="Presentation1.zip" id="SM1" mimetype="application/zip" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table1.DOCX" id="SM2" mimetype="application/DOCX" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table2.DOCX" id="SM3" mimetype="application/DOCX" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table3.DOCX" id="SM4" mimetype="application/DOCX" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="DataSheet1.XLSX" id="SM5" mimetype="application/XLSX" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="DataSheet2.XLSX" id="SM6" mimetype="application/XLSX" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<sec id="s11">
<title>Abbreviations</title>
<p>CTD, C-terminal domain; COSMIC, Catalogue Of Somatic Mutations In Cancer cell lines database; Dic, dicoumarol; FAD, Flavin adenine dinucleotide; GEMME: Global Epistatic Model for predicting Mutational Effects; gnomAD, Genome Aggregation Database; HDX, hydrogen/deuterium exchange; HEPES, 2-[4-(2-hydroxyethyl)piperazin-1-yl]ethanesulfonic acid; IMAC, Immobilized metal affinity chromatography; <italic>K</italic>
<sub>d</sub>, apparent dissociation constant; <italic>k</italic>
<sub>obs</sub>, observed rate constant for proteolysis; <italic>k</italic>
<sub>prot</sub>, second-order rate constant for proteolysis; LoF, Loss-of-function; MMI, monomer:monomer interface; MSA, multiple sequence alignment; NTD, N-terminal domain; NQO1, NAD(P)H:quinone oxidoreductase 1; S, soluble protein levels; SASA, solvent accessible surface area; SDS-PAGE, polyacrylamide gel electrophoresis in the presence of sodium dodecylsulphate; S/T, Soluble/Total ratio of NQO1 protein; <italic>T</italic>
<sub>m</sub>, apparent half-denaturation temperature; WT, wild-type; &#x394;<italic>E</italic>, Normalized predicted effect of an amino acid substitution from the GEMME model; &#x394;&#x394;<italic>G</italic>, computationally calculated change in unfolding Gibbs free energy between a variant and the WT protein; &#x394;&#x394;<italic>G</italic>
<sub>FAD</sub>, difference in binding Gibbs free energy between a variant and the WT protein; &#x394;&#x394;<italic>G</italic>
<sub>melting</sub>, operational metric for the estimation of the unfolding Gibbs free energy changes between a variant and the WT protein from &#x394;<italic>T</italic>
<sub>m</sub>; &#x394;&#x394;<italic>G</italic>
<sub>PROT</sub>, difference in free energy of cleavable and non-cleavable states for proteolysis between a variant and the WT protein; &#x394;<italic>T</italic>
<sub>m</sub>, difference in <italic>T</italic>
<sub>m</sub> between a variant and the WT protein.</p>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Abildgaard</surname>
<given-names>A. B.</given-names>
</name>
<name>
<surname>Stein</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Nielsen</surname>
<given-names>S. V.</given-names>
</name>
<name>
<surname>Schultz-Knudsen</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Papaleo</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Shrikhande</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Computational and cellular studies reveal structural destabilization and degradation of MLH1 variants in Lynch syndrome</article-title>. <source>Elife</source> <volume>8</volume>, <fpage>e49138</fpage>. <pub-id pub-id-type="doi">10.7554/eLife.49138</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Anoz-Carbonell</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Timson</surname>
<given-names>D. J.</given-names>
</name>
<name>
<surname>Pey</surname>
<given-names>A. L.</given-names>
</name>
<name>
<surname>Medina</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>The catalytic cycle of the antioxidant and cancer-associated human NQO1 enzyme: Hydride transfer, conformational dynamics and functional cooperativity</article-title>. <source>Antioxidants</source> <volume>9</volume>, <fpage>772</fpage>. <pub-id pub-id-type="doi">10.3390/antiox9090772</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Arnedo-Pac</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Lopez-Bigas</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Mui&#xf1;os</surname>
<given-names>F.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Predicting disease variants using biodiversity and machine learning</article-title>. <source>Nat. Biotechnol.</source> <volume>40</volume>, <fpage>27</fpage>&#x2013;<lpage>28</lpage>. <pub-id pub-id-type="doi">10.1038/s41587-021-01187-w</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Asher</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Dym</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Tsvetkov</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Adler</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Shaul</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2006</year>). <article-title>The crystal structure of NAD(P)H quinone oxidoreductase 1 in complex with its potent inhibitor dicoumarol</article-title>. <source>Biochemistry</source> <volume>45</volume>, <fpage>6372</fpage>&#x2013;<lpage>6378</lpage>. <pub-id pub-id-type="doi">10.1021/bi0600087</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Asher</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Tsvetkov</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Kahana</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Shaul</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>A mechanism of ubiquitin-independent proteasomal degradation of the tumor suppressors p53 and p73</article-title>. <source>Genes Dev.</source> <volume>19</volume>, <fpage>316</fpage>&#x2013;<lpage>321</lpage>. <pub-id pub-id-type="doi">10.1101/gad.319905</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Beaver</surname>
<given-names>S. K.</given-names>
</name>
<name>
<surname>Mesa-Torres</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Pey</surname>
<given-names>A. L.</given-names>
</name>
<name>
<surname>Timson</surname>
<given-names>D. J.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>NQO1: A target for the treatment of cancer and neurological diseases, and a model to understand loss of function disease mechanisms</article-title>. <source>Biochim. Biophys. Acta. Proteins Proteom.</source> <volume>1867</volume>, <fpage>663</fpage>&#x2013;<lpage>676</lpage>. <pub-id pub-id-type="doi">10.1016/j.bbapap.2019.05.002</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ben-Nissan</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Sharon</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Regulating the 20S proteasome ubiquitin-independent degradation pathway</article-title>. <source>Biomolecules</source> <volume>4</volume>, <fpage>862</fpage>&#x2013;<lpage>884</lpage>. <pub-id pub-id-type="doi">10.3390/biom4030862</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cagiada</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Johansson</surname>
<given-names>K. E.</given-names>
</name>
<name>
<surname>Valanciute</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Nielsen</surname>
<given-names>S. V.</given-names>
</name>
<name>
<surname>Hartmann-Petersen</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>J. J.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Understanding the origins of loss of protein function by analyzing the effects of thousands of variants on activity and abundance</article-title>. <source>Mol. Biol. Evol.</source> <volume>38</volume>, <fpage>3235</fpage>&#x2013;<lpage>3246</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/msab095</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>di Francesco</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>di Germanio</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Panda</surname>
<given-names>A. C.</given-names>
</name>
<name>
<surname>Huynh</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Peaden</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Navas-Enamorado</surname>
<given-names>I.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>Novel RNA-binding activity of NQO1 promotes SERPINA1 mRNA translation</article-title>. <source>Free Radic. Biol. Med.</source> <volume>99</volume>, <fpage>225</fpage>&#x2013;<lpage>233</lpage>. <pub-id pub-id-type="doi">10.1016/j.freeradbiomed.2016.08.005</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Faig</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Bianchet</surname>
<given-names>M. A.</given-names>
</name>
<name>
<surname>Talalay</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Winski</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Ross</surname>
<given-names>D.</given-names>
</name>
<etal/>
</person-group> (<year>2000</year>). <article-title>Structures of recombinant human and mouse NAD(P)H:quinone oxidoreductases: Species comparison and structural changes with substrate binding and release</article-title>. <source>Proc. Natl. Acad. Sci. U. S. A.</source> <volume>97</volume>, <fpage>3177</fpage>&#x2013;<lpage>3182</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.050585797</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Frazer</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Notin</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Dias</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Gomez</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Min</surname>
<given-names>J. K.</given-names>
</name>
<name>
<surname>Brock</surname>
<given-names>K.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Disease variant prediction with deep generative models of evolutionary data</article-title>. <source>Nature</source> <volume>599</volume>, <fpage>91</fpage>&#x2013;<lpage>95</lpage>. <pub-id pub-id-type="doi">10.1038/s41586-021-04043-8</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Frenz</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Lewis</surname>
<given-names>S. M.</given-names>
</name>
<name>
<surname>King</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>DiMaio</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Park</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Song</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Prediction of protein mutational free energy: Benchmark and sampling improvements increase classification accuracy</article-title>. <source>Front. Bioeng. Biotechnol.</source> <volume>8</volume>, <fpage>558247</fpage>. <pub-id pub-id-type="doi">10.3389/fbioe.2020.558247</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>H&#xf8;ie</surname>
<given-names>M. H.</given-names>
</name>
<name>
<surname>Cagiada</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Beck Frederiksen</surname>
<given-names>A. H.</given-names>
</name>
<name>
<surname>Stein</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Lindorff-Larsen</surname>
<given-names>K.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Predicting and interpreting large-scale mutagenesis data using analyses of protein stability and conservation</article-title>. <source>Cell Rep.</source> <volume>38</volume>, <fpage>110207</fpage>. <pub-id pub-id-type="doi">10.1016/j.celrep.2021.110207</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Iskander</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Barrios</surname>
<given-names>R. J.</given-names>
</name>
<name>
<surname>Jaiswal</surname>
<given-names>A. K.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>Disruption of NAD(P)H:quinone oxidoreductase 1 gene in mice leads to radiation-induced myeloproliferative disease</article-title>. <source>Cancer Res.</source> <volume>68</volume>, <fpage>7915</fpage>&#x2013;<lpage>7922</lpage>. <pub-id pub-id-type="doi">10.1158/0008-5472.CAN-08-0766</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Iskander</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Gaikwad</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Paquet</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Long</surname>
<given-names>D. J.</given-names>
</name>
<name>
<surname>Brayton</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Barrios</surname>
<given-names>R.</given-names>
</name>
<etal/>
</person-group> (<year>2005</year>). <article-title>Lower induction of p53 and decreased apoptosis in NQO1-null mice lead to increased sensitivity to chemical-induced skin carcinogenesis</article-title>. <source>Cancer Res.</source> <volume>65</volume>, <fpage>2054</fpage>&#x2013;<lpage>2058</lpage>. <pub-id pub-id-type="doi">10.1158/0008-5472.CAN-04-3157</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kabsch</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Sander</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>1983</year>). <article-title>Dictionary of protein secondary structure: Pattern recognition of hydrogen-bonded and geometrical features</article-title>. <source>Biopolymers</source> <volume>22</volume>, <fpage>2577</fpage>&#x2013;<lpage>2637</lpage>. <pub-id pub-id-type="doi">10.1002/bip.360221211</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Katsonis</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Wilhelm</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Williams</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Lichtarge</surname>
<given-names>O.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Genome interpretation using <italic>in silico</italic> predictors of variant impact</article-title>. <source>Hum. Genet.</source> <volume>141</volume>, <fpage>1549</fpage>&#x2013;<lpage>1577</lpage>. <pub-id pub-id-type="doi">10.1007/s00439-022-02457-6</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Laine</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Karami</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Carbone</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Gemme: A simple and fast global epistatic model predicting mutational effects</article-title>. <source>Mol. Biol. Evol.</source> <volume>36</volume>, <fpage>2604</fpage>&#x2013;<lpage>2619</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/msz179</pub-id>
</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lajin</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Alachkar</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>The NQO1 polymorphism C609T (Pro187Ser) and cancer susceptibility: A comprehensive meta-analysis</article-title>. <source>Br. J. Cancer</source> <volume>109</volume>, <fpage>1325</fpage>&#x2013;<lpage>1337</lpage>. <pub-id pub-id-type="doi">10.1038/bjc.2013.357</pub-id>
</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Bianchet</surname>
<given-names>M. A.</given-names>
</name>
<name>
<surname>Talalayt</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Amzel</surname>
<given-names>L. M.</given-names>
</name>
</person-group> (<year>1995</year>). <article-title>The three-dimensional structure of NAD(P)H:quinone reductase, a flavoprotein involved in cancer chemoprotection and chemotherapy: Mechanism of the two-electron reduction</article-title>. <source>Proc. Natl. Acad. Sci. U. S. A.</source> <volume>92</volume>, <fpage>8846</fpage>&#x2013;<lpage>8850</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.92.19.8846</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lienhart</surname>
<given-names>W. D.</given-names>
</name>
<name>
<surname>Gudipati</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Uhl</surname>
<given-names>M. K.</given-names>
</name>
<name>
<surname>Binter</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Pulido</surname>
<given-names>S. A.</given-names>
</name>
<name>
<surname>Saf</surname>
<given-names>R.</given-names>
</name>
<etal/>
</person-group> (<year>2014</year>). <article-title>Collapse of the native structure caused by a single amino acid exchange in human NAD(P)H:Quinone oxidoreductase</article-title>. <source>FEBS J.</source> <volume>281</volume>, <fpage>4691</fpage>&#x2013;<lpage>4704</lpage>. <pub-id pub-id-type="doi">10.1111/febs.12975</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Long</surname>
<given-names>D. J.</given-names>
</name>
<name>
<surname>Waikel</surname>
<given-names>R. L.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>X. J.</given-names>
</name>
<name>
<surname>Perlaky</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Roop</surname>
<given-names>D. R.</given-names>
</name>
<name>
<surname>Jaiswal</surname>
<given-names>A. K.</given-names>
</name>
</person-group> (<year>2000</year>). <article-title>NAD(P)H:quinone oxidoreductase 1 deficiency increases susceptibility to benzo(a)pyrene-induced mouse skin carcinogenesis</article-title>. <source>Cancer Res.</source> <volume>60</volume>, <fpage>5913</fpage>&#x2013;<lpage>5915</lpage>.</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Luo</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Kang</surname>
<given-names>S. S.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Z. H.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Day</surname>
<given-names>J. X.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>Z.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Akt phosphorylates NQO1 and triggers its degradation, abolishing its antioxidative activities in Parkinson&#x2019;s disease</article-title>. <source>J. Neurosci.</source> <volume>39</volume>, <fpage>7291</fpage>&#x2013;<lpage>7305</lpage>. <pub-id pub-id-type="doi">10.1523/JNEUROSCI.0625-19.2019</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Luque</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Freire</surname>
<given-names>E.</given-names>
</name>
</person-group> (<year>2000</year>). <article-title>Structural stability of binding sites: Consequences for binding affinity and allosteric effects</article-title>. <source>Proteins</source> <volume>4</volume>, <fpage>63</fpage>&#x2013;<lpage>71</lpage>. <pub-id pub-id-type="doi">10.1002/1097-0134(2000)41:4&#x2b;&#x3c;63::aid-prot60&#x3e;3.3.co;2-y</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Luque</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Leavitt</surname>
<given-names>S. A.</given-names>
</name>
<name>
<surname>Freire</surname>
<given-names>E.</given-names>
</name>
</person-group> (<year>2002</year>). <article-title>The linkage between protein folding and functional cooperativity: Two sides of the same coin?</article-title> <source>Annu. Rev. Biophys. Biomol. Struct.</source> <volume>31</volume>, <fpage>235</fpage>&#x2013;<lpage>256</lpage>. <pub-id pub-id-type="doi">10.1146/annurev.biophys.31.082901.134215</pub-id>
</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mart&#xed;nez-Jim&#xe9;nez</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Mui&#xf1;os</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Sent&#xed;s</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Deu-Pons</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Reyes-Salazar</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Arnedo-Pac</surname>
<given-names>C.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>A compendium of mutational cancer driver genes</article-title>. <source>Nat. Rev. Cancer</source> <volume>20</volume>, <fpage>555</fpage>&#x2013;<lpage>572</lpage>. <pub-id pub-id-type="doi">10.1038/s41568-020-0290-x</pub-id>
</citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mart&#xed;nez-Lim&#xf3;n</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Alriquet</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Lang</surname>
<given-names>W. H.</given-names>
</name>
<name>
<surname>Calloni</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Wittig</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Vabulas</surname>
<given-names>R. M.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Recognition of enzymes lacking bound cofactor by Protein quality control</article-title>. <source>Proc. Natl. Acad. Sci. U. S. A.</source> <volume>113</volume>, <fpage>12156</fpage>&#x2013;<lpage>12161</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1611994113</pub-id>
</citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mart&#xed;nez-Lim&#xf3;n</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Calloni</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Ernst</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Vabulas</surname>
<given-names>R. M.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Flavin dependency undermines proteome stability, lipid metabolism and cellular proliferation during vitamin B2 deficiency</article-title>. <source>Cell Death Dis.</source> <volume>11</volume>, <fpage>725</fpage>. <pub-id pub-id-type="doi">10.1038/s41419-020-02929-5</pub-id>
</citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>McInnes</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Sharo</surname>
<given-names>A. G.</given-names>
</name>
<name>
<surname>Koleske</surname>
<given-names>M. L.</given-names>
</name>
<name>
<surname>Brown</surname>
<given-names>J. E. H.</given-names>
</name>
<name>
<surname>Norstad</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Adhikari</surname>
<given-names>A. N.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Opportunities and challenges for the computational interpretation of rare variation in clinically important genes</article-title>. <source>Am. J. Hum. Genet.</source> <volume>108</volume>, <fpage>535</fpage>&#x2013;<lpage>548</lpage>. <pub-id pub-id-type="doi">10.1016/j.ajhg.2021.03.003</pub-id>
</citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Medina-Carmona</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Betancor-Fern&#xe1;ndez</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Santos</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Mesa-Torres</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Grottelli</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Batlle</surname>
<given-names>C.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Insight into the specificity and severity of pathogenic mechanisms associated with missense mutations through experimental and structural perturbation analyses</article-title>. <source>Hum. Mol. Genet.</source> <volume>28</volume>, <fpage>1</fpage>&#x2013;<lpage>15</lpage>. <pub-id pub-id-type="doi">10.1093/hmg/ddy323</pub-id>
</citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Medina-Carmona</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Fuchs</surname>
<given-names>J. E.</given-names>
</name>
<name>
<surname>Gavira</surname>
<given-names>J. A.</given-names>
</name>
<name>
<surname>Mesa-Torres</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Neira</surname>
<given-names>J. L.</given-names>
</name>
<name>
<surname>Salido</surname>
<given-names>E.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>Enhanced vulnerability of human proteins towards disease-associated inactivation through divergent evolution</article-title>. <source>Hum. Mol. Genet.</source> <volume>26</volume>, <fpage>3531</fpage>&#x2013;<lpage>3544</lpage>. <pub-id pub-id-type="doi">10.1093/hmg/ddx238</pub-id>
</citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Medina-Carmona</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Neira</surname>
<given-names>J. L.</given-names>
</name>
<name>
<surname>Salido</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Fuchs</surname>
<given-names>J. E.</given-names>
</name>
<name>
<surname>Palomino-Morales</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Timson</surname>
<given-names>D. J.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>Site-to-site interdomain communication may mediate different loss-of-function mechanisms in a cancer-associated NQO1 polymorphism</article-title>. <source>Sci. Rep.</source> <volume>7</volume>, <fpage>44532</fpage>. <pub-id pub-id-type="doi">10.1038/srep44532</pub-id>
</citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Medina-Carmona</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Palomino-Morales</surname>
<given-names>R. J.</given-names>
</name>
<name>
<surname>Fuchs</surname>
<given-names>J. E.</given-names>
</name>
<name>
<surname>Pad&#xed;n-Gonzalez</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Mesa-Torres</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Salido</surname>
<given-names>E.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>Erratum: Conformational dynamics is key to understanding loss-of-function of NQO1 cancer-associated polymorphisms and its correction by pharmacological ligands</article-title>. <source>Sci. Rep.</source> <volume>6</volume> (<issue>1</issue>), <fpage>21939</fpage>. <pub-id pub-id-type="doi">10.1038/srep21939</pub-id>
</citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Medina-Carmona</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Rizzuti</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Mart&#xed;n-Escolano</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Pacheco-Garc&#xed;a</surname>
<given-names>J. L.</given-names>
</name>
<name>
<surname>Mesa-Torres</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Neira</surname>
<given-names>J. L.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Phosphorylation compromises FAD binding and intracellular stability of wild-type and cancer-associated NQO1: Insights into flavo-proteome stability</article-title>. <source>Int. J. Biol. Macromol.</source> <volume>125</volume>, <fpage>1275</fpage>&#x2013;<lpage>1288</lpage>. <pub-id pub-id-type="doi">10.1016/j.ijbiomac.2018.09.108</pub-id>
</citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Naganathan</surname>
<given-names>A. N.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Modulation of allosteric coupling by mutations: From protein dynamics and packing to altered native ensembles and function</article-title>. <source>Curr. Opin. Struct. Biol.</source> <volume>54</volume>, <fpage>1</fpage>&#x2013;<lpage>9</lpage>. <pub-id pub-id-type="doi">10.1016/j.sbi.2018.09.004</pub-id>
</citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Oh</surname>
<given-names>E. T.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>J. W.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>J. M.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>S. J.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>J. S.</given-names>
</name>
<name>
<surname>Hong</surname>
<given-names>S. S.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>NQO1 inhibits proteasome-mediated degradation of HIF-1&#x3b1;</article-title>. <source>Nat. Commun.</source> <volume>7</volume>, <fpage>13593</fpage>. <pub-id pub-id-type="doi">10.1038/ncomms13593</pub-id>
</citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pacheco-Garcia</surname>
<given-names>J. L.</given-names>
</name>
<name>
<surname>Anoz-Carbonell</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Loginov</surname>
<given-names>D. S.</given-names>
</name>
<name>
<surname>Vankova</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Salido</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Man</surname>
<given-names>P.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Different phenotypic outcome due to site-specific phosphorylation in the cancer-associated NQO1 enzyme studied by phosphomimetic mutations</article-title>. <source>Arch. Biochem. Biophys.</source> <volume>729</volume>, <fpage>109392</fpage>. <pub-id pub-id-type="doi">10.1016/j.abb.2022.109392</pub-id>
</citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pacheco-Garcia</surname>
<given-names>J. L.</given-names>
</name>
<name>
<surname>Anoz-Carbonell</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Vankova</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Kannan</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Palomino-Morales</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Mesa-Torres</surname>
<given-names>N.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Structural basis of the pleiotropic and specific phenotypic consequences of missense mutations in the multifunctional NAD(P)H:quinone oxidoreductase 1 and their pharmacological rescue</article-title>. <source>Redox Biol.</source> <volume>46</volume>, <fpage>102112</fpage>. <pub-id pub-id-type="doi">10.1016/j.redox.2021.102112</pub-id>
</citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pacheco-Garc&#xed;a</surname>
<given-names>J. L.</given-names>
</name>
<name>
<surname>Cano-Mu&#xf1;oz</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>S&#xe1;nchez-Ramos</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Salido</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Pey</surname>
<given-names>A. L.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Naturally-occurring rare mutations cause mild to catastrophic effects in the multifunctional and cancer-associated NQO1 protein</article-title>. <source>J. Pers. Med.</source> <volume>10</volume>, <fpage>E207</fpage>&#x2013;<lpage>E231</lpage>. <pub-id pub-id-type="doi">10.3390/jpm10040207</pub-id>
</citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pacheco-Garcia</surname>
<given-names>J. L.</given-names>
</name>
<name>
<surname>Loginov</surname>
<given-names>D. S.</given-names>
</name>
<name>
<surname>Anoz-Carbonell</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Vankova</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Palomino-Morales</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Salido</surname>
<given-names>E.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Allosteric communication in the multifunctional and redox NQO1 protein studied by cavity-making mutations</article-title>. <source>Antioxidants</source> <volume>11</volume>, <fpage>1110</fpage>. <pub-id pub-id-type="doi">10.3390/antiox11061110</pub-id>
</citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Park</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Marqusee</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2004</year>). <article-title>Probing the high energy states in proteins by proteolysis</article-title>. <source>J. Mol. Biol.</source> <volume>343</volume>, <fpage>1467</fpage>&#x2013;<lpage>1476</lpage>. <pub-id pub-id-type="doi">10.1016/j.jmb.2004.08.085</pub-id>
</citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Park</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Bradley</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Greisen</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Mulligan</surname>
<given-names>V. K.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>D. E.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>Simultaneous optimization of biomolecular energy functions on features from small molecules and macromolecules</article-title>. <source>J. Chem. Theory Comput.</source> <volume>12</volume>, <fpage>6201</fpage>&#x2013;<lpage>6212</lpage>. <pub-id pub-id-type="doi">10.1021/acs.jctc.6b00819</pub-id>
</citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pey</surname>
<given-names>A. L.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Biophysical and functional perturbation analyses at cancer-associated P187 and K240 sites of the multifunctional NADP(H):quinone oxidoreductase 1</article-title>. <source>Int. J. Biol. Macromol.</source> <volume>118</volume>, <fpage>1912</fpage>&#x2013;<lpage>1923</lpage>. <pub-id pub-id-type="doi">10.1016/j.ijbiomac.2018.07.051</pub-id>
</citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pey</surname>
<given-names>A. L.</given-names>
</name>
<name>
<surname>Megarity</surname>
<given-names>C. F.</given-names>
</name>
<name>
<surname>Timson</surname>
<given-names>D. J.</given-names>
</name>
</person-group> (<year>2004</year>). <article-title>FAD binding overcomes defects in activity and stability displayed by cancer-associated variants of human NQO1</article-title>. <source>Biochim. Biophys. Acta</source> <volume>1842</volume>, <fpage>2163</fpage>&#x2013;<lpage>2173</lpage>. <pub-id pub-id-type="doi">10.1016/j.bbadis.2014.08.011</pub-id>
</citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Radjendirane</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Joseph</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>Y. H.</given-names>
</name>
<name>
<surname>Kimura</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Klein-Szanto</surname>
<given-names>A. J.</given-names>
</name>
<name>
<surname>Gonzalez</surname>
<given-names>F. J.</given-names>
</name>
<etal/>
</person-group> (<year>1998</year>). <article-title>Disruption of the DT diaphorase (NQO1) gene in mice leads to increased menadione toxicity</article-title>. <source>J. Biol. Chem.</source> <volume>273</volume>, <fpage>7382</fpage>&#x2013;<lpage>7389</lpage>. <pub-id pub-id-type="doi">10.1074/jbc.273.13.7382</pub-id>
</citation>
</ref>
<ref id="B46">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Remmert</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Biegert</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Hauser</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>S&#xf6;ding</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>HHblits: Lightning-fast iterative protein sequence searching by HMM-HMM alignment</article-title>. <source>Nat. Methods</source> <volume>9</volume>, <fpage>173</fpage>&#x2013;<lpage>175</lpage>. <pub-id pub-id-type="doi">10.1038/nmeth.1818</pub-id>
</citation>
</ref>
<ref id="B47">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ross</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Siegel</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>NQO1 in protection against oxidative stress</article-title>. <source>Curr. Opin. Toxicol.</source> <volume>7</volume>, <fpage>67</fpage>&#x2013;<lpage>72</lpage>. <pub-id pub-id-type="doi">10.1016/j.cotox.2017.10.005</pub-id>
</citation>
</ref>
<ref id="B48">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Salido</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Timson</surname>
<given-names>D. J.</given-names>
</name>
<name>
<surname>Betancor-Fern&#xe1;ndez</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Palomino-Morales</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Anoz-Carbonell</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Pacheco-Garc&#xed;a</surname>
<given-names>J. L.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Targeting HIF-1&#x3b1; function in cancer through the chaperone action of NQO1: Implications of genetic diversity of NQO1</article-title>. <source>J. Pers. Med.</source> <volume>12</volume>, <fpage>747</fpage>. <pub-id pub-id-type="doi">10.3390/jpm12050747</pub-id>
</citation>
</ref>
<ref id="B49">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Siegel</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Bersie</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Harris</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>di Francesco</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Armstrong</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Reisdorph</surname>
<given-names>N.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>A redox-mediated conformational change in NQO1 controls binding to microtubules and &#x3b1;-tubulin acetylation</article-title>. <source>Redox Biol.</source> <volume>39</volume>, <fpage>101840</fpage>. <pub-id pub-id-type="doi">10.1016/j.redox.2020.101840</pub-id>
</citation>
</ref>
<ref id="B50">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Stein</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Fowler</surname>
<given-names>D. M.</given-names>
</name>
<name>
<surname>Hartmann-Petersen</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Lindorff-Larsen</surname>
<given-names>K.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Biophysical and mechanistic models for disease-causing protein variants</article-title>. <source>Trends biochem. Sci.</source> <volume>44</volume>, <fpage>575</fpage>&#x2013;<lpage>588</lpage>. <pub-id pub-id-type="doi">10.1016/j.tibs.2019.01.003</pub-id>
</citation>
</ref>
<ref id="B51">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Steinegger</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Meier</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Mirdita</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>V&#xf6;hringer</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Haunsberger</surname>
<given-names>S. J.</given-names>
</name>
<name>
<surname>S&#xf6;ding</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>HH-suite3 for fast remote homology detection and deep protein annotation</article-title>. <source>BMC Bioinforma.</source> <volume>20</volume>, <fpage>473</fpage>. <pub-id pub-id-type="doi">10.1186/s12859-019-3019-7</pub-id>
</citation>
</ref>
<ref id="B52">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Vankova</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Salido</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Timson</surname>
<given-names>D. J.</given-names>
</name>
<name>
<surname>Man</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Pey</surname>
<given-names>A. L.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>A dynamic core in human NQO1 controls the functional and stability effects of ligand binding and their communication across the enzyme dimer</article-title>. <source>Biomolecules</source> <volume>9</volume>, <fpage>728</fpage>. <pub-id pub-id-type="doi">10.3390/biom9110728</pub-id>
</citation>
</ref>
<ref id="B53">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Watson</surname>
<given-names>M. D.</given-names>
</name>
<name>
<surname>Monroe</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Raleigh</surname>
<given-names>D. P.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Size-dependent relationships between protein stability and thermal unfolding temperature have important implications for analysis of protein energetics and high-throughput assays of protein-ligand interactions</article-title>. <source>J. Phys. Chem. B</source> <volume>122</volume>, <fpage>5278</fpage>&#x2013;<lpage>5285</lpage>. <pub-id pub-id-type="doi">10.1021/acs.jpcb.7b05684</pub-id>
</citation>
</ref>
<ref id="B54">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xu</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Tang</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Katsonis</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Lichtarge</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Jones</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Bovo</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>Benchmarking predictions of allostery in liver pyruvate kinase in CAGI4</article-title>. <source>Hum. Mutat.</source> <volume>38</volume>, <fpage>1123</fpage>&#x2013;<lpage>1131</lpage>. <pub-id pub-id-type="doi">10.1002/humu.23222</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>