<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<?covid-19-tdm?>
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Microbiol.</journal-id>
<journal-title>Frontiers in Microbiology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Microbiol.</abbrev-journal-title>
<issn pub-type="epub">1664-302X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fmicb.2023.1073789</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Microbiology</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Nuclear translocation of spike mRNA and protein is a novel feature of SARS-CoV-2</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Sattar</surname>
<given-names>Sarah</given-names>
</name>
<xref rid="aff1" ref-type="aff"><sup>1</sup></xref>
<xref rid="fn0003" ref-type="author-notes"><sup>&#x2020;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/2100520/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Kabat</surname>
<given-names>Juraj</given-names>
</name>
<xref rid="aff2" ref-type="aff"><sup>2</sup></xref>
<xref rid="fn0003" ref-type="author-notes"><sup>&#x2020;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/1919742/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Jerome</surname>
<given-names>Kailey</given-names>
</name>
<xref rid="aff1" ref-type="aff"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Feldmann</surname>
<given-names>Friederike</given-names>
</name>
<xref rid="aff3" ref-type="aff"><sup>3</sup></xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Bailey</surname>
<given-names>Kristina</given-names>
</name>
<xref rid="aff4" ref-type="aff"><sup>4</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/60928/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Mehedi</surname>
<given-names>Masfique</given-names>
</name>
<xref rid="aff1" ref-type="aff"><sup>1</sup></xref>
<xref rid="c001" ref-type="corresp"><sup>&#x002A;</sup></xref>
<xref rid="fn0003" ref-type="author-notes"><sup>&#x2020;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/223864/overview"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>Department of Biomedical Sciences, University of North Dakota School of Medicine and Health Sciences</institution>, <addr-line>Grand Forks, ND</addr-line>, <country>United States</country></aff>
<aff id="aff2"><sup>2</sup><institution>Biological Imaging Section, Research Technology Branch, National Institute of Allergy and Infectious Diseases, National Institutes of Health</institution>, <addr-line>Bethesda, MD</addr-line>, <country>United States</country></aff>
<aff id="aff3"><sup>3</sup><institution>Division of Intramural Research, National Institute of Allergy and Infectious Diseases, National Institutes of Health</institution>, <addr-line>Hamilton, MT</addr-line>, <country>United States</country></aff>
<aff id="aff4"><sup>4</sup><institution>Department of Internal Medicine, Pulmonary, Critical Care, and Sleep and Allergy, University of Nebraska Medical Center</institution>, <addr-line>Omaha, NE</addr-line>, <country>United States</country></aff>
<author-notes>
<fn id="fn0001" fn-type="edited-by"><p>Edited by: Patrick C. Y. Woo, National Chung Hsing University, Taiwan</p></fn>
<fn id="fn0002" fn-type="edited-by"><p>Reviewed by: Hyung-Joo Kwon, Hallym University, Republic of Korea; Milan Surjit, Translational Health Science and Technology Institute, India</p></fn>
<corresp id="c001">&#x002A;Correspondence: Masfique Mehedi, <email>masfique.mehedi@und.edu</email></corresp>
<fn id="fn0003" fn-type="equal"><p><sup>&#x2020;</sup>These authors have contributed equally to this work</p></fn>
<fn id="fn0004" fn-type="other"><p>This article was submitted to Virology, a section of the journal Frontiers in Microbiology</p></fn>
</author-notes>
<pub-date pub-type="epub">
<day>26</day>
<month>01</month>
<year>2023</year>
</pub-date>
<pub-date pub-type="collection">
<year>2023</year>
</pub-date>
<volume>14</volume>
<elocation-id>1073789</elocation-id>
<history>
<date date-type="received">
<day>18</day>
<month>10</month>
<year>2022</year>
</date>
<date date-type="accepted">
<day>12</day>
<month>01</month>
<year>2023</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2023 Sattar, Kabat, Jerome, Feldmann, Bailey and Mehedi.</copyright-statement>
<copyright-year>2023</copyright-year>
<copyright-holder>Sattar, Kabat, Jerome, Feldmann, Bailey and Mehedi</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>Severe acute respiratory syndrome coronavirus 2 (SARS-CoV-2) causes severe pathophysiology in vulnerable older populations and appears to be highly pathogenic and more transmissible than other coronaviruses. The spike (S) protein appears to be a major pathogenic factor that contributes to the unique pathogenesis of SARS-CoV-2. Although the S protein is a surface transmembrane type 1 glycoprotein, it has been predicted to be translocated into the nucleus due to the novel nuclear localization signal (NLS) &#x201C;PRRARSV,&#x201D; which is absent from the S protein of other coronaviruses. Indeed, S proteins translocate into the nucleus in SARS-CoV-2-infected cells. S mRNAs also translocate into the nucleus. S mRNA colocalizes with S protein, aiding the nuclear translocation of S mRNA. While nuclear translocation of nucleoprotein (N) has been shown in many coronaviruses, the nuclear translocation of both S mRNA and S protein reveals a novel feature of SARS-CoV-2.</p>
</abstract>
<kwd-group>
<kwd>SARS-CoV-2</kwd>
<kwd>spike</kwd>
<kwd>NLS</kwd>
<kwd>nuclear translocation</kwd>
<kwd>mRNA</kwd>
</kwd-group>
<contract-num rid="cn1">P20GM113123 and T34GM122835</contract-num>
<contract-num rid="cn2">101-BX005413</contract-num>
<contract-sponsor id="cn1">NIH/NIGMS</contract-sponsor>
<contract-sponsor id="cn2">NIAID, NIH</contract-sponsor>
<counts>
<fig-count count="6"/>
<table-count count="0"/>
<equation-count count="0"/>
<ref-count count="54"/>
<page-count count="12"/>
<word-count count="9682"/>
</counts>
</article-meta>
</front>
<body>
<sec id="sec1" sec-type="intro">
<title>Introduction</title>
<p>The recently emerged severe acute respiratory syndrome coronavirus 2 (SARS-CoV-2), along with SARS-CoV and Middle East respiratory syndrome coronavirus (MERS-CoV), belong to the <italic>Coronaviridae</italic> virus family. The current ongoing outbreak has shown that SARS-CoV-2 is highly pathogenic and more transmissible than SARS-CoV or MERS-CoV (<xref ref-type="bibr" rid="ref21">Liu et al., 2020</xref>). These coronaviruses contain a positive-strand RNA genome with a few unique features: two-thirds of the viral RNA is translated into a large polyprotein, and the remainder of the viral genome is transcribed by a discontinuous transcription process into a nested set of subgenomic mRNAs (<xref ref-type="bibr" rid="ref33">Pasternak et al., 2006</xref>; <xref ref-type="bibr" rid="ref35">Perlman and Netland, 2009</xref>; <xref ref-type="bibr" rid="ref42">Sola et al., 2015</xref>). The different subgenomic RNAs encode four conserved structural proteins (spike, S; envelope, E; membrane, M, and nucleocapsid, N) and several accessory proteins (<xref ref-type="bibr" rid="ref4">Bojkova et al., 2020</xref>; <xref ref-type="bibr" rid="ref10">Finkel et al., 2021</xref>). The S protein of both SARS-CoV and SARS-CoV-2 interacts with the host cell receptor angiotensin converting enzyme 2 (ACE2) and triggers fusion between the viral envelope and host cell membrane to facilitate successful viral entry (<xref ref-type="bibr" rid="ref17">Jia et al., 2005</xref>; <xref ref-type="bibr" rid="ref15">Hoffmann et al., 2020</xref>). However, the S protein of MERS-CoV binds to dipentidyl peptidase (DPP4) to facilitate entry into cells (<xref ref-type="bibr" rid="ref37">Raj et al., 2013</xref>). Importantly, the SARS-CoV-2&#x2009;S protein is a significant pathogenic factor because of its broad tropism for mammalian ACE2 (<xref ref-type="bibr" rid="ref6">Conceicao et al., 2020</xref>). While the S protein is an attractive target for therapeutic development (<xref ref-type="bibr" rid="ref22">Martinez-Flores et al., 2021</xref>), the lack of comprehensive information on S protein expression and subcellular translocation hinders the identification of an effective S protein-targeting therapeutic to combat SARS-CoV-2 infection.</p>
<p>The genome sequence is generally the blueprint for detecting biological function (<xref ref-type="bibr" rid="ref13">Harrow et al., 2009</xref>). Thus, the S protein&#x2019;s function is encoded in the S gene sequence. Identifying novel features in the S gene sequence, its expression and subcellular localization may shed light on the unique pathogenesis of SARS-CoV-2 compared to other pathogenic beta-coronaviruses, particularly SARS-CoV and MERS-CoV. A recent study showed several SARS-CoV-2 genomic features, including novel sequence insertions and enhanced N protein nuclear localization signals (NLSs) that are thought to be responsible for the unique pathogenesis of this coronavirus (<xref ref-type="bibr" rid="ref12">Gussow et al., 2020</xref>). There are three types of NLSs: pat4, pat7, and bipartite. The pat4 signal is a chain of 4 basic amino acids consisting of lysine or arginine or three basic amino acids, with the last amino acid being either histidine or proline. The pat7 signal begins with proline and is followed by six amino acids, which contains a four-residue sequence in which three of the four residues are basic. The bipartite signal consists of two basic amino acids with a 10-residue spacer and a five amino acid sequence in which at least three of the five amino acids are basic (<xref ref-type="bibr" rid="ref38">Robbins et al., 1991</xref>; <xref ref-type="bibr" rid="ref14">Hicks and Raikhel, 1995</xref>; <xref ref-type="bibr" rid="ref39">Rowland et al., 2005</xref>). The subcellular localization of some SARS-CoV-2 proteins has been studied <italic>in vitro</italic> (<xref ref-type="bibr" rid="ref52">Zhang J. et al., 2020</xref>), but a comprehensive understanding of the subcellular localization of the S protein is missing.</p>
<p>Here, we first report the nuclear translocation of S protein and mRNA in SARS-CoV-2-infected cells. The translocation of the SARS-CoV-2&#x2009;S mRNA appeared to be assisted by the S protein, which contains an NLS motif that is unique among human pathogenic beta-coronaviruses.</p>
</sec>
<sec id="sec2" sec-type="results">
<title>Results</title>
<sec id="sec3">
<title>The novel NLS motif &#x201C;PRRARSV&#x201D; is in the S protein of SARS-CoV-2 but not SARS-CoV or MERS-CoV</title>
<p>Several groups have reported novel nucleotide insertions in the S gene of SARS-CoV-2, as indicated by a multiple sequence alignment for the S protein sequences of different coronaviruses, such as a polybasic site &#x201C;PRRA&#x201D; produced by a 12-nucleotide acquisition at the S1-S2 boundary through multiple host-species adaptations (<xref ref-type="bibr" rid="ref2">Andersen et al., 2020</xref>; <xref ref-type="bibr" rid="ref47">Walls et al., 2020</xref>). However, S protein sequence alignments between SARS-CoV-2 and SARS-CoV showed the possibility of the insertions &#x201C;NSPR&#x201D; (<xref ref-type="bibr" rid="ref54">Zhang C. et al., 2020</xref>) and &#x201C;SPRR&#x201D; (<xref ref-type="bibr" rid="ref50">Xie et al., 2020</xref>) at the S1-S2 boundary. It has previously been reported that the sequence insertion at the S1-S2 boundary constitutes a furin cleavage site (<xref ref-type="bibr" rid="ref26">Ord et al., 2020</xref>; <xref ref-type="bibr" rid="ref34">Peacock et al., 2021</xref>). A comprehensive understanding of the consequence of the sequence insertion at the S1-S2 boundary is still missing, possibly because research focused on understanding the differences in the pathogenicity of the different SARS-CoV-2 variants and subvariants, which emerged rapidly. To determine whether the earlier SARS-CoV-2 isolate (USA/WA-CDC-WA1/2020 isolate, GenBank accession no. MN985325) has multiple novel sequence insertions in the S protein compared to SARS-CoV (Urbani strain, GenBank accession no. AY278741), we aligned the S protein sequences of both viruses using a constraint-based alignment tool for multiple protein sequences (COBALT) (<xref ref-type="bibr" rid="ref31">Papadopoulos and Agarwala, 2007</xref>). We did not use MER-CoV for comparison because there is only 40% similarity between SARS-CoV-2 and MERS-CoV (<xref ref-type="bibr" rid="ref16">Hu et al., 2020</xref>). Similar to a previous report (<xref ref-type="bibr" rid="ref54">Zhang C. et al., 2020</xref>), we found sequence insertions (IS) in the SARS-CoV-2&#x2009;S protein at four independent positions: IS1 &#x201C;GTNGKTR,&#x201D; IS2 &#x201C;YYHK,&#x201D; IS3 &#x201C;HRSY,&#x201D; and IS4 &#x201C;NSPR&#x201D; (<xref rid="fig1" ref-type="fig">Figures 1A</xref>, <xref rid="fig1" ref-type="fig">B</xref>). To determine whether any of these sequence insertions constituted or resembled any protein motifs, such as an NLS, we analyzed the SARS-CoV-2&#x2009;S protein <italic>in silico</italic> with the PSORT II web portal for NLS prediction (<xref ref-type="bibr" rid="ref25">Nakai and Horton, 1999</xref>). We found that the SARS-CoV-2 glycoprotein contained an NLS of the &#x201C;pat7&#x201D; motifs, one of the three NLS motifs described above (<xref rid="SM1" ref-type="supplementary-material">Supplementary Figure S1</xref>). To our surprise, the NLS motif &#x201C;PRRARSV&#x201D; was present at the proposed polybasic site and was due to the fourth sequence insertion &#x201C;NSPR&#x201D; (<xref rid="fig1" ref-type="fig">Figures 1A</xref>, <xref rid="fig1" ref-type="fig">B</xref>; <xref rid="SM1" ref-type="supplementary-material">Supplementary Figure S1</xref>). As expected, the NLS in the S protein was unique to SARS-CoV-2 among human pathogenic beta-coronaviruses, as neither the SARS-CoV S protein nor the MERS-CoV S protein has an NLS (<xref rid="SM1" ref-type="supplementary-material">Supplementary Figure S1</xref>).</p>
<fig position="float" id="fig1">
<label>Figure 1</label>
<caption>
<p>Only the SARS-CoV-2&#x2009;S protein had an NLS motif &#x201C;PRRARSV&#x201D; due to a novel sequence insertion. <bold>(A)</bold> Full-length SARS-CoV-2 genome (nucleotide) (USA/WA-CDC-WA1/2020 isolate, GenBank accession no. MN985325) and open reading frames (ORF) are shown at the top. The SARS-CoV-2&#x2009;S protein amino acid sequence was aligned with SARS-CoV (Urbani strain, GenBank accession no. AY278741) by NCBI&#x2019;s constraint-based multiple alignment tool COBALT (<xref ref-type="bibr" rid="ref31">Papadopoulos and Agarwala, 2007</xref>), and the relative positions of four novel sequence insertions (ISs) are shown in the S protein ORF as follows: IS1: &#x201C;GTNGKTR,&#x201D; IS2: &#x201C;YYHK,&#x201D; IS3: &#x201C;HRSY,&#x201D; and IS4: &#x201C;NSPR.&#x201D; The fourth IS (NSPR) created a pat7 NLS &#x201C;PRRARSV&#x201D; in the S protein (shown in the red rectangle). <bold>(B)</bold> The S protein ORF sequences between SARS-CoV-2 and SARS-CoV were aligned, and the Lined rectangles highlight the four novel insertions: IS1, IS2, IS3, and IS4. The IS4 &#x201C;NSPR&#x201D; created a pat7 NLS &#x201C;PRRARSV&#x201D; in the S protein (shown in the black rectangle).</p>
</caption>
<graphic xlink:href="fmicb-14-1073789-g001.tif"/>
</fig>
</sec>
<sec id="sec4">
<title>NLS-driven nuclear translocation of S protein (including S mRNA) occurs only in the SARS-CoV-2-infected airway epithelium</title>
<p>Although viral glycoprotein nuclear translocation is rare, NLS-driven protein nuclear translocation has already been established in different viral infections (<xref ref-type="bibr" rid="ref30">Ozawa et al., 2007</xref>; <xref ref-type="bibr" rid="ref3">Boisvert et al., 2014</xref>). Thus, it is important to determine whether the SARS-CoV-2&#x2009;S protein translocates into the nucleus in addition to its canonical cell surface localization through the ER-Golgi pathway. We hypothesized that the S protein could translocate into the nucleus in SARS-CoV-2-infected cells <italic>via</italic> the identified NLS motif (<xref ref-type="bibr" rid="ref39">Rowland et al., 2005</xref>; <xref ref-type="bibr" rid="ref30">Ozawa et al., 2007</xref>; <xref ref-type="bibr" rid="ref3">Boisvert et al., 2014</xref>). We infected highly differentiated pseudostratified airway epithelial cells (which mimics <italic>in vivo</italic> human airway epithelium) with SARS-CoV-2 at a multiplicity of infection (MOI) of 0.1 for 4 days. First, we confirmed the presence of S mRNA and S protein in a 5&#x2009;&#x03BC;m section of formalin-fixed paraffin-embedded SARS-CoV-2-infected cells by RNAscope and immunofluorescence analysis. Despite the rarity of viral mRNA (or even positive-strand RNA virus genome) to be nuclear (<xref ref-type="bibr" rid="ref48">Whittaker and Helenius, 1998</xref>; <xref ref-type="bibr" rid="ref46">Vargas et al., 2005</xref>), a recent study showed that SARS-CoV-2 mRNA accumulates in the nucleus of infected cells (<xref ref-type="bibr" rid="ref1">Addetia et al., 2021</xref>). Our results showed that SARS-CoV-2&#x2009;S mRNA was nuclear (<xref rid="fig2" ref-type="fig">Figure 2</xref> left panel and merged images in the right panel). To confirm the physical apposition between S mRNA and the nucleus by comparing their distributions in fluorescent images, we used the spot-to-spot colocalization function in Imaris image analysis software (Oxford Instruments). We found that S mRNA was nuclear and abundant in the cytoplasm (<xref rid="SM1" ref-type="supplementary-material">Supplementary Figure S2</xref>, top panel, three donors). To avoid image artifacts, we imaged multiple independent slides of SARS-CoV-2-infected airway epithelium (from three independent donors) using at least two different high-end confocal microscopes. Additionally, we used at least two different image processing strategies to determine nuclear localization. Based on high-resolution imaging, we determined the subcellular distribution of S mRNA at near single-molecule and single-cell levels (<xref rid="fig2" ref-type="fig">Figures 2</xref>, <xref rid="fig3" ref-type="fig">3A</xref>; <xref rid="SM1" ref-type="supplementary-material">Supplementary Figures S2, S3</xref>). Importantly, we were able to determine S mRNA nuclear translocation not only inside the nucleus but also on the nuclear surface (<xref rid="fig3" ref-type="fig">Figures 3A</xref>, <xref rid="fig3" ref-type="fig">C</xref>; <xref rid="SM1" ref-type="supplementary-material">Supplementary Figure S3</xref>). The determination of S mRNA distribution and abundance showed that S mRNA subcellular localization spans from the inside and outer surface of the nuclear membrane to everywhere in the cytoplasm. We found that almost 90% of S mRNA was distributed in the cytoplasm, which was expected, as SARS-CoV-2 transcription and replication occur in the cytoplasm (<xref rid="fig3" ref-type="fig">Figures 3A</xref>, <xref rid="fig3" ref-type="fig">C</xref>; <xref rid="SM1" ref-type="supplementary-material">Supplementary Figure S3</xref>). Interestingly, less than 10% of S mRNA was detected at the nuclear surface, which could explain the transitionary stage of S mRNA before it enters the nucleus or the novel transnuclear-membrane translocation of S mRNA, which was examined and described later (<xref rid="fig3" ref-type="fig">Figures 3A</xref>, <xref rid="fig3" ref-type="fig">C</xref>; <xref rid="SM1" ref-type="supplementary-material">Supplementary Figure S3</xref>). In approximately 1% of instances, S mRNA successfully translocated into the nucleus (<xref rid="fig3" ref-type="fig">Figures 3A</xref>, <xref rid="fig3" ref-type="fig">C</xref>; <xref rid="SM1" ref-type="supplementary-material">Supplementary Figure S3</xref>). The nuclear translocation of S mRNA is highly unusual because there have been few previous reports of S mRNA nuclear translocation and no information on the mechanism of nuclear translocation. However, we have explored how S mRNA could translocate into the nucleus.</p>
<fig position="float" id="fig2">
<label>Figure 2</label>
<caption>
<p>The intracellular distribution of S mRNA and S protein suggests nuclear translocation. Four-week highly differentiated pseudostratified airway epithelium was infected with SARS-CoV-2 at a MOI of 0.1 for 4 days, paraformaldehyde-fixed, paraffin-embedded, and sectioned at a thickness of 5&#x2009;&#x03BC;m for immunohistochemistry (IHC) and slide preparation (<xref ref-type="bibr" rid="ref28">Osan et al., 2020</xref>, <xref ref-type="bibr" rid="ref27">2021</xref>). A combined protocol of RNAscope and IHC was used to simultaneously detect S mRNA and S protein in the SARS-CoV-2-infected airway epithelium. S mRNA (red) was detected using a SARS-CoV-2&#x2009;S mRNA probe for RNAscope, and S protein (cyan) was detected by an S protein-specific rabbit polyclonal antibody and a corresponding anti-rabbit secondary antibody for immunofluorescence (IFA) analysis. The nucleus (blue) was detected by DAPI staining. The images were taken under an Olympus confocal microscope using a 60x oil objective. The images represent multiple independent technical replicates from two independent experiments with different donors (experiment 1: donors 2 and 3 and experiment 2: donor 1). The scale bar is 10&#x2009;&#x03BC;m.</p>
</caption>
<graphic xlink:href="fmicb-14-1073789-g002.tif"/>
</fig>
<fig position="float" id="fig3">
<label>Figure 3</label>
<caption>
<p>The nuclear translocation of S protein and S mRNA includes both the outer surface and inside of the nucleus. Separate slides (see <xref rid="fig2" ref-type="fig">Figure 2</xref>) were imaged under a Leica Stellaris confocal microscope (Leica) using a 63x oil objective. The images were then deconvolved using Huygen Essential deconvolution software (Scientific Volume Imaging). Using the surface rendering function of an image processing IMARIS software. <bold>(A)</bold> S mRNA (red) on the nuclear surface (top) and inside the nucleus (bottom). White arrows indicate S protein on the nuclear surface (top image) or inside the nucleus (bottom image). <bold>(B)</bold> S protein (green) on the nuclear surface (top image) and inside the nucleus (bottom image). White arrows indicate S protein on the nuclear surface (top image) or inside the nucleus (bottom image). <bold>(C)</bold> The total distribution of S mRNA and S protein in the cells. The data were obtained by combining multiple images from an independent experiment. <bold>(D)</bold> The total colocalization between S mRNA and S protein in the cells. The data were obtained by combining multiple images from an independent experiment.</p>
</caption>
<graphic xlink:href="fmicb-14-1073789-g003.tif"/>
</fig>
<p>We investigated whether the S protein translocated into the nucleus in the SARS-CoV-2-infected airway epithelium. Consistent with the S mRNA data, we found that the S protein translocated into the nucleus and was abundant on the cellular surface through the cytoplasmic ER-Golgi pathway (<xref rid="fig2" ref-type="fig">Figure 2</xref>, middle panel and merged images in the right panel). Based on high-resolution imaging, we determined that S protein nuclear translocation included both the inside of the nucleus and the nuclear surface (<xref rid="fig3" ref-type="fig">Figures 3B</xref>, <xref rid="fig3" ref-type="fig">C</xref>; <xref rid="SM1" ref-type="supplementary-material">Supplementary Figure S3</xref>). Similar to S mRNA quantification, we were able to quantify the distribution and abundance of S protein in the infected airway epithelium. We found that the S protein was distributed inside and in the outer membrane of the nucleus, the cytoplasmic ER-Golgi and the cell surface. We did not determine what portion of the S protein was localized inside and outside the cell surface. However, we quantified the subcellular distribution of the S protein inside the nucleus, outside the surface of the nucleus, and in the cytoplasm, which included cell surface expression because the S protein is a type 1 transmembrane glycoprotein. We found that approximately 75% of the S protein was distributed in sites other than the nucleus, including the cell surface and the cytoplasm, which was expected, as S protein translation and protein processing occur in the cytoplasm and <italic>via</italic> cytoplasmic ER-Golgi pathway, respectively (<xref rid="fig3" ref-type="fig">Figures 3B</xref>, <xref rid="fig3" ref-type="fig">C</xref>; <xref rid="SM1" ref-type="supplementary-material">Supplementary Figure S3</xref>). Interestingly, approximately 15% of the S protein was detected at the nuclear surface, which could explain the S protein transitionary stage before entering the nucleus or a novel transnuclear-membrane translocation of S protein, which was examined and described later (<xref rid="fig3" ref-type="fig">Figures 3A</xref>, <xref rid="fig3" ref-type="fig">C</xref>; <xref rid="SM1" ref-type="supplementary-material">Supplementary Figure S3</xref>). Interestingly, we found that a higher percentage of total S protein translocated into the nucleus than S mRNA (<xref rid="fig3" ref-type="fig">Figures 3A</xref>&#x2013;<xref rid="fig3" ref-type="fig">C</xref>; <xref rid="SM1" ref-type="supplementary-material">Supplementary Figure S3</xref>). Although viral type-1 transmembrane glycoprotein translocation into the nucleus is rare, the NLS in the S protein is responsible for nuclear translocation. It was apparent that NLS-driven S protein nuclear translocation was SARS-CoV-2 specific, and a side-by-side infection experiment with both viruses showed that the S protein of SARS-CoV did not translocate into the nucleus (<xref rid="SM1" ref-type="supplementary-material">Supplementary Figure S4</xref>). As both S mRNA and S protein translocated into the nucleus, it is important to determine whether S mRNA and S protein colocalize in different subcellular sites.</p>
</sec>
<sec id="sec5">
<title>Colocalization of S mRNA and S protein in different subcellular locations in the SARS-CoV-2-infected airway epithelium</title>
<p>While we can explain S protein nuclear translocation due to the presence of an NLS motif in the amino acid sequence, we can only hypothesize that S mRNA nuclear translocation is possible due to a direct interaction between S protein and S mRNA, which can be explained by the colocalization between them. The SARS-CoV-2&#x2009;N protein is an abundant RNA binding protein that is essential for viral genome packaging (<xref ref-type="bibr" rid="ref7">Cubuk et al., 2021</xref>). While the structural basis of N protein binding to single-or double-stranded RNA is known (<xref ref-type="bibr" rid="ref9">Dinesh et al., 2020</xref>), there is no information about whether S protein binds to S mRNA. As we found similar intracellular distribution of both S mRNA and S protein, we hypothesized that S protein interacts with S mRNA to translocate the protein&#x2013;mRNA complex to different subcellular locations, including the cytoplasm and nucleus, but not the cell surface. By examining the colocalization between the S protein and S mRNA, we could confirm the presence of the protein&#x2013;mRNA complex in the SARS-CoV-2-infected airway epithelium. Here, we refer to colocalization as an association between S mRNA and S protein at different intracellular locations. Technically, two separate fluorescence molecules that emit different wavelengths of light are superimposed within an indeterminate microscope resolution. To determine whether S mRNA and S protein colocalize, we used a high-resolution imaging strategy. We quantified the colocalization on a percentage scale. We found that approximately 85% of the colocalization, which was the highest, was observed outside the nucleus (<xref rid="fig3" ref-type="fig">Figure 3D</xref>). These data are consistent with the previously described spatial expression data of both S protein and S mRNA (<xref rid="fig3" ref-type="fig">Figures 3A</xref>&#x2013;<xref rid="fig3" ref-type="fig">C</xref>). As expected, lower and the lowest percentages of colocalization between the S protein and S mRNA were observed on the nuclear surface and inside the nucleus, respectively (<xref rid="fig3" ref-type="fig">Figure 3D</xref>). We were able to pinpoint the colocalization site by using high magnification confocal imaging followed by image processing. Representatives of S mRNA and S protein colocalization in the cytoplasm (<xref rid="fig4" ref-type="fig">Figure 4</xref>, top two panels), on the surface of the nuclear membrane (<xref rid="fig4" ref-type="fig">Figure 4</xref>, middle two panels), or inside the nucleus (<xref rid="fig4" ref-type="fig">Figure 4</xref>, bottom two panels) are shown. We observed S protein and S mRNA colocalization in three subcellular locations, which was confirmed at the single-cell level in SARS-CoV-2-infected cells (<xref rid="SM1" ref-type="supplementary-material">Supplementary Figure S5</xref>). We also observed that S mRNA inside and on the nuclear surface was associated with the S protein, in contrast to the cytoplasmic S mRNA distribution with or without colocalization with the S protein (<xref rid="fig4" ref-type="fig">Figure 4</xref>; <xref rid="SM1" ref-type="supplementary-material">Supplementary Figure S5</xref>). Thus, S mRNA translocates into the nucleus through the S protein-S mRNA complex and is driven by the S protein (<xref rid="fig4" ref-type="fig">Figure 4</xref>; <xref rid="SM1" ref-type="supplementary-material">Supplementary Figure S5</xref>).</p>
<fig position="float" id="fig4">
<label>Figure 4</label>
<caption>
<p>Colocalization between S mRNA and S protein inside infected cells. The images (see <xref rid="fig3" ref-type="fig">Figure 3</xref>) were analyzed by using the surface rendering and colocalization features of IMARIS. S protein and S mRNA distribution and colocalization in the cytoplasm (top panel), on the nuclear surface (middle panel) and inside the nucleus (bottom panel). The specific region of colocalization is indicated by a white spot. Scale bar 0.5&#x2009;&#x03BC;m.</p>
</caption>
<graphic xlink:href="fmicb-14-1073789-g004.tif"/>
</fig>
</sec>
<sec id="sec6">
<title>SARS-CoV-2 S protein&#x2019;s transient expression confirms its nuclear translocation in the transfected cells</title>
<p>To determine whether SARS-CoV-2&#x2009;S protein&#x2019;s nuclear translocation is independent of other viral protein&#x2019;s involvement, we transfected primary normal human bronchial epithelial (NHBE) cells with a recombinant plasmid containing codon-optimized full-length DNA sequence of SARS-CoV-2&#x2009;S protein (<xref ref-type="bibr" rid="ref20">Leventhal et al., 2021</xref>) for 48&#x2009;h. We used an immunofluorescent assay (IFA) to detect the S protein in the transfected cells. We found a broader subcellular distribution of S protein (<xref rid="SM1" ref-type="supplementary-material">Supplementary Figure S6A</xref>). Both vertical and horizontal cross-sections of the epifluorescence images showed that the fluorescence signal of the S protein overlapped the nuclear stain. However, it was prudent to determine whether the observed S protein nuclear distribution is independent of its abundant endoplasmic reticulum (ER) distribution, as it is processed there before translocating to the cell surface. Thus, we further investigated the S protein&#x2019;s nuclear translocation in the lung epithelial A549 cells. We first co-stained the S protein and a common ER protein, calnexin. We found that S protein sub-cellular distribution beyond ER, which complemented our previous finding of its nuclear translocation (<xref rid="SM1" ref-type="supplementary-material">Supplementary Figure S6B</xref>). However, we need to show S protein translocated into the nucleus in the transfected A549 cells. We co-stained the S protein and lamin B1, a nuclear inner membrane protein. We found that S protein fluorescence overlapped with the lamin B1 suggesting S protein&#x2019;s nuclear translocation in the transfected A549 cells (<xref rid="SM1" ref-type="supplementary-material">Supplementary Figure S6C</xref>). S protein nuclear distribution was distinct from the eGFP&#x2019;s diffusive expression throughout the cells (<xref rid="SM1" ref-type="supplementary-material">Supplementary Figure S6C</xref>). In addition to a fluorescent-based detection strategy, we used a biochemical approach to confirm the S protein&#x2019;s nuclear translocation. We hypothesized that the SARS-CoV-2&#x2009;S protein should be detected in nuclear and cytoplasmic fractionating to the SARS-CoV-2&#x2009;S plasmid transfected cells. We transfected A549 cells with the same plasmid for 72&#x2009;h. For control, we similarly mock-transfected A549 cells without the plasmid. We collected cytoplasmic and nuclear fractions of the S protein plasmid transfected or mock-transfected using ReadiPrep Nuclear/Cytoplasmic Fraction kit (AAT Bioquest) according to the manufacturer&#x2019;s instructions. We found S protein in both the nuclear and cytoplasmic fractions of the transfected A549 cells (<xref rid="fig5" ref-type="fig">Figure 5</xref>). We detected lamin A and C and cell division cycle protein 42 (Cdc42) on the same gel to confirm no mix-up between nuclear and cytoplasmic portions. While lamin A and C were detected in the nuclear portion, Cdc42 was detected only in the cytoplasmic portion (<xref rid="fig5" ref-type="fig">Figure 5</xref>). Our results suggested that transient expression of the SARS-CoV-2&#x2009;S protein caused its wider subcellular distribution, including the nucleus in the transfected cells.</p>
<fig position="float" id="fig5">
<label>Figure 5</label>
<caption>
<p>S protein in both cytoplasmic and nuclear fraction of the transfected A549 cells. A549 cells were transfected with SARS-CoV-2&#x2009;S plasmid (<xref ref-type="bibr" rid="ref20">Leventhal et al., 2021</xref>) for 72&#x2009;h. SARS-CoV-2&#x2009;S protein was detected in both cytoplasmic and nuclear fractions by Western blotting. Cdc-42 detection confirms cytoplasmic portion and Lamin A and C detection confirms nuclear fraction.</p>
</caption>
<graphic xlink:href="fmicb-14-1073789-g005.tif"/>
</fig>
</sec>
<sec id="sec7">
<title>NLS-driven N protein nuclear translocation is common in SARS-CoV, MERS-CoV, and SARS-CoV-2 infections</title>
<p>There is no comprehensive information on SARS-CoV-2&#x2009;N protein NLS motifs, and we already know that other pathogenic coronaviruses, particularly SARS-CoV (<xref ref-type="bibr" rid="ref39">Rowland et al., 2005</xref>; <xref ref-type="bibr" rid="ref45">Timani et al., 2005</xref>) and MERS-CoV (<xref ref-type="bibr" rid="ref51">Yang et al., 2013</xref>) N proteins, have NLSs. Therefore, we searched for NLSs in the SARS-CoV-2&#x2009;N protein by using the PSORT II. We found that the SARS-CoV-2&#x2009;N protein has 7 NLSs covering all three types of NLS motifs (pat4: 2; pat7: 3, and bipartite: 2); however, the SARS-CoV N protein has 8 NLS motifs (pat4: 2; pat7: 4, and bipartite: 2) (<xref rid="SM1" ref-type="supplementary-material">Supplementary Figure S7</xref>). N protein translocation into the nucleus or at least the perinuclear region was confirmed (<xref rid="fig6" ref-type="fig">Figure 6A</xref>; <xref rid="SM1" ref-type="supplementary-material">Supplementary Figure S8</xref>). However, SARS-CoV-2&#x2009;N protein nuclear translocation was not as robust as SARS-CoV nuclear translocation (<xref rid="fig6" ref-type="fig">Figure 6B</xref>; <xref rid="SM1" ref-type="supplementary-material">Supplementary Figure S8</xref>). The reduced nuclear translocation of the SARS-CoV-2&#x2009;N protein is probably due to the absence of one pat7 NLS motif in the SARS-CoV-2&#x2009;N protein compared to that in SARS-CoV (<xref rid="SM1" ref-type="supplementary-material">Supplementary Figures S8, S9</xref>).</p>
<fig position="float" id="fig6">
<label>Figure 6</label>
<caption>
<p>The nucleoproteins of SARS-CoV, MERS-CoV, and SARS-CoV-2 translocate into the nucleus. <bold>(A)</bold> Four-week pseudostratified airway epithelium was infected with SARS-CoV-2 at a MOI of 0.1 for 4 days, fixed, paraffin-embedded, and sectioned at a thickness of 5&#x2009;&#x03BC;m for immunohistochemistry slide preparation. Simultaneous detection of S mRNA (shown in red) and N protein (shown in cyan) on the same slide was performed by a combined detection protocol in RNAscope-based mRNA and immunofluorescence-based protein detection. An S mRNA-specific probe was used for RNAscope, and an N protein-specific rabbit polyclonal antibody and the corresponding anti-rabbit secondary antibody were used. The nucleus (shown in blue) was detected by DAPI staining. The images were taken under an Olympus confocal microscope using a 60x oil objective. The images represent multiple independent technical replicates from two independent, healthy donors (top row: donor #1 and bottom row: donor #2). The scale bar is 10&#x2009;&#x03BC;m. <bold>(B)</bold> Four-week pseudostratified airway epithelium was infected with SARS-CoV-2, SARS-CoV, or MERS-CoV at an MOI of 0.1 for 4 days. SARS-CoV-2 or SARS-CoV N protein was detected by an N protein-specific rabbit polyclonal antibody and corresponding anti-rabbit secondary antibody. Similarly, the MERS N protein was detected by MERS N protein-specific primary and corresponding secondary antibodies. The nucleus (shown in blue) was detected by DAPI staining. The images represent multiple independent technical replicates from one experiment (donor #1).</p>
</caption>
<graphic xlink:href="fmicb-14-1073789-g006.tif"/>
</fig>
</sec>
</sec>
<sec id="sec8" sec-type="discussions">
<title>Discussion</title>
<p>In the context of SARS-CoV, one of the controversies regarding the natural origin of SARS-CoV-2 is that its S gene has multiple novel sequence insertions. Zhang C. et al. analyzed the report by Pradhan et al. (withdrawn) (<xref ref-type="bibr" rid="ref36">Pradhan et al., 2020</xref>) on the presence of four unique novel sequences in the SARS-CoV-2&#x2009;S gene and showed that these four sequence insertions were not related to the receptor-binding domain (RBD) (<xref ref-type="bibr" rid="ref54">Zhang C. et al., 2020</xref>). A recent study identified S gene novel sequence insertions among several key genomic features that differentiate SARS-CoV-2 from other beta-coronaviruses, particularly SARS-CoV and MERS-CoV (<xref ref-type="bibr" rid="ref12">Gussow et al., 2020</xref>). The source and characterization of these sequence insertions have yet to be determined; however, the closest BLAST hit of these sequences is bat coronavirus RaTG13 (<xref ref-type="bibr" rid="ref11">Gibson et al., 1992</xref>). Similar to a previous report (<xref ref-type="bibr" rid="ref54">Zhang C. et al., 2020</xref>), we found four multiple sequence insertions in the SARS-CoV-2&#x2009;S protein: IS1 &#x201C;GTNGKTR,&#x201D; IS2 &#x201C;YYHK,&#x201D; &#x201C;HRSY,&#x201D; and IS4 &#x201C;NSPR&#x201D; (<xref rid="fig1" ref-type="fig">Figure 1</xref>). Here, we showed that the fourth novel sequence insertion in the S gene created a functional pat7 NLS motif and resulted in nuclear translocation of the S protein, which not only complemented previous <italic>in silico</italic> findings (<xref ref-type="bibr" rid="ref12">Gussow et al., 2020</xref>) but also identified a novel pathogenic genomic feature of the S gene. Surprisingly, the fourth sequence insertion has received attention due to the description of a proposed polybasic furin cleavage site &#x201C;RRAR,&#x201D; which may contribute to increased serin protease-driven entry of SARS-CoV-2 (<xref ref-type="bibr" rid="ref2">Andersen et al., 2020</xref>) and is implicated in broader tropism and/or enhanced viral transmissibility compared to SARS-CoV (<xref ref-type="bibr" rid="ref47">Walls et al., 2020</xref>). Interestingly, the proposed SARS-CoV-2 furin cleavage site (P-R-R-A-R) considered as noncanonical, as a consensus recognition sequences for furin proteases is (X-Arg-X-Lys/Arg-Arg-X) (<xref ref-type="bibr" rid="ref18">Klimstra et al., 1999</xref>; <xref ref-type="bibr" rid="ref5">Chan and Zhan, 2022</xref>). Thus a generic furin consensus cleavage site motif should contain the canonical four amino acid motif R-X-[K/R]-R, although R-X-X-R is the minimal cleavage site on the substrate for successful furin cleavage (<xref ref-type="bibr" rid="ref19">Krysan et al., 1999</xref>; <xref ref-type="bibr" rid="ref44">Tian et al., 2011</xref>). However, we found that the IS4 &#x201C;NSPR&#x201D; created a pat7 NLS &#x201C;PRRARSV&#x201D; in the S protein, which was unique to SARS-CoV-2. Whether this noncanonical furin cleavage destroys the function of the NLS motif is important to determine, as the proposed noncanonical furin cleavage site is constitutively within the NLS motif (described later). Due to the specificity of the amino acid motif, a furin cleavage motif is not expected to fulfill the characteristics of an NLS motif. We first reported that the S protein translocated into the nucleus in the SARS-CoV-2-infected airway epithelium, which is an appropriate lung model for studying respiratory virus infection <italic>in vitro</italic> (<xref ref-type="bibr" rid="ref27">Osan et al., 2021</xref>, <xref ref-type="bibr" rid="ref29">2022</xref>). Our results confirmed that the SARS-CoV-2&#x2009;S protein was a unique addition to the list of viral proteins that possess NLSs and consequently translocate into the nucleus of infected cells (<xref ref-type="bibr" rid="ref39">Rowland et al., 2005</xref>; <xref ref-type="bibr" rid="ref30">Ozawa et al., 2007</xref>; <xref ref-type="bibr" rid="ref32">Parent, 2011</xref>; <xref ref-type="bibr" rid="ref3">Boisvert et al., 2014</xref>). We also confirmed S protein&#x2019;s nuclear translocation primarily due to its NLS motif, as transient expression of S protein in either primary NHBE cells or A549 cell line showed its broader subcellular distribution including nucleus. Among coronaviruses, SARS-CoV-2&#x2009;S protein is the first type-1 transmembrane glycoprotein that translocates into the nucleus. Vesicular stomatitis virus (VSV), which is a negative sense RNA virus, has a glycoprotein that translocates to the nucleus as well. A study by the University of Illinois at Urbana Champaign showed exactly how the glycoprotein on VSV was able to travel to the nucleus of hamster kidney cells (<xref ref-type="bibr" rid="ref8">DaPoian et al., 1996</xref>).</p>
<p>NLS-driven S protein nuclear translocation is a novel feature of SARS-CoV-2 infection compared to other pathogenic coronaviruses. However, the pathogenic contribution of the S protein&#x2019;s NLS motif to virus-induced pathophysiology is yet to be determined. Our results suggested that the S protein translocated into the nucleus due to the NLS, which also raised two important points. First, we investigated whether the proposed polybasic site &#x201C;RRAR&#x201D; could itself be an NLS motif. The answer was that the proposed polybasic site was not an NLS motif because an NLS is a well characterized and predefined amino acid sequence motif (<xref ref-type="bibr" rid="ref38">Robbins et al., 1991</xref>; <xref ref-type="bibr" rid="ref14">Hicks and Raikhel, 1995</xref>; <xref ref-type="bibr" rid="ref39">Rowland et al., 2005</xref>). Additionally, the amino acid sequence of the probable sequence insertion &#x201C;NSPR&#x201D; (<xref ref-type="bibr" rid="ref54">Zhang C. et al., 2020</xref>) was also not an NLS but was part of the P7 &#x201C;PRRARSV&#x201D; NLS. Thus, the inserted sequence creates the NLS in the S protein of SARS-CoV-2 and may make SARS-CoV-2 unique among human pathogenic coronaviruses.</p>
<p>The second important point was whether the NLS motif was functional in the context of the described polybasic site at the S1/S2 boundary. All type-1 transmembrane glycoproteins are processed through the ER-Golgi pathway before signal peptide-driven cellular surface localization. The proposed polybasic site was functional (availability to proteases) when the S protein was on the virion for host cell entry. A fully posttranslationally processed S protein surface translocation could also provide a polybasic site to be processed by furin cleavage. However, there is no information on the availability or usability of the S protein&#x2019;s polybasic site by furin proteases in the cytoplasm before virus assembly. Thus, the NLS is functional in SARS-CoV-2-infected cells, and the polybasic site only functions during the viral entry step. The NLS is obviously functional in infected cells, and no furin cleavage at the polybasic site is necessary other than for viral entry. Our results confirmed that the S protein NLS motif was functional in SARS-CoV-2-infected cells. Although mutating the polybasic site (which also mutated the NLS) may impact viral S protein function <italic>in vitro</italic>, the result will not confirm or deny that one is more important than the other between the polybasic site and the NLS. While our result does provide direct evidence for the presence of the NLS motif and nuclear translocation of the S protein, our results do not confirm nor deny that the NSPR sequence has a natural origin. Instead, our results showed that the inserted sequence NSPR created a functional NLS motif, which increased the intracellular distribution of the S protein, including novel nuclear translocation. The novel nuclear translocation of the SARS-CoV-2&#x2009;S protein suggests that: 1. the nuclear translocation of the S protein reduces its surface expression, but whether it contributes to evading host immune recognition remains to be determined; and 2. the colocalization of the S protein with S mRNA suggests that the S protein has an RNA binding motif, which remains to be determined. One of the important ways of confirming a functional NLS motif is to use site-directed mutational analysis. Plasmid-driven transient expression of S protein in the human lung airway A549 cell line and primary normal human branchial epithelial cells showed robust S expression but was toxic to the cells. Therefore, the success of site-directed mutational analysis of the S protein in a transient expression system is doubtful and the characterization of NLS by a mutational analysis is yet to be determined. Thus, our novel findings emphasize further research on the NLS motif of the SARS-CoV-2&#x2009;S protein.</p>
<p>One of the most important findings in our study was the simultaneous detection of the different spatial distributions of S protein and S mRNA at near single-molecule level in a single infected cell. We confirmed that S mRNA translocated into the nucleus by image analysis of the colocalization of S mRNA with nuclear staining. When SARS-CoV-2&#x2009;N protein has already been shown to bind to RNA (<xref ref-type="bibr" rid="ref40">Schmidt et al., 2021</xref>), we still do not know how exactly S protein binds to S mRNA for nuclear translocation. We only know is S mRNA nuclear translocation is more likely mediated by the S protein because S mRNA nuclear translocation was always associated with the S protein. Importantly, S mRNA colocalized with the S protein in the cytoplasm and nucleus (both inside and outside the surface of the nucleus). Our results support a previous machine learning based study findings SARS-CoV-2 RNA genome and sub-genomic RNAs can be translocated in the host cells&#x2019; mitochondrial matrix and nucleus (<xref ref-type="bibr" rid="ref49">Wu et al., 2020</xref>). Our results suggest that around 1% S mRNA translocated into the nucleus. S mRNA&#x2019;s (potentially SARS-CoV-2 mRNA genome) subcellular localization may play a significant role in SARS-CoV-2 pathogenesis. To determine whether the SARS-CoV-2 genome interacts with either S protein or N protein, we <italic>in silico</italic> analyzed RNA-protein interactions using the RPISeq web portal, which offers the only sequence-based prediction model (<xref ref-type="bibr" rid="ref24">Muppirala et al., 2011</xref>). We found that both S and N protein binding probability to the SARS-CoV-2 genome scored exactly 1 (Dataset S1 and S2). SARS-CoV-2&#x2009;N protein is an abundant RNA binding protein essential for viral genome packaging (<xref ref-type="bibr" rid="ref7">Cubuk et al., 2021</xref>). While the structural basis of N binding to single or double-stranded RNA is known (<xref ref-type="bibr" rid="ref9">Dinesh et al., 2020</xref>), we found that S mRNA nuclear translocation aids <italic>via</italic> S protein. However, the mechanism of S protein binding to the mRNA or possibly positive-strand RNA genome is yet to be determined. Although the primer-probe was designed to target S mRNA, the SARS-CoV-2 positive-strand RNA genome (whole or partial) can be targeted by the same probe due to the sequence similarity between S mRNA and the whole or partial genome. Thus, our results lack sufficient detail contributing to the discussion of the controversial scientific topic of whether there is any possibility of SARS-CoV-2 genome integration into the host DNA (<xref ref-type="bibr" rid="ref41">Smits et al., 2021</xref>; <xref ref-type="bibr" rid="ref53">Zhang et al., 2021</xref>). Additionally, one of the significant differences in the S protein sequences of SARS-CoV and SARS-CoV-2 is the pat7 NLS motif. Our results showed that transient expression of S protein by a plasmid containing the full-length S protein DNA sequence in both primary NHBE cells and A549 cell line lead its wider subcellular distribution including nucleus. Whether S protein expression by the current vaccine platforms causes suboptimal expression of S protein on the cell surface due to the NLS remains to be determined.</p>
<p>In conclusion, the SARS-CoV-2&#x2009;S protein has a functional pat7 NLS &#x201C;PRRARSV,&#x201D; that results in one out of four S proteins translocating into the nucleus in infected cells. S Protein appears to shuttle S mRNA (possibly the genome) into the nucleus of the infected cells. Transient expression of full-length S protein in A549 cells reveals its nuclear translocation suggesting S protein&#x2019;s nuclear translocation is NLS-driven and independent of interacting with another viral protein. Thus NLS of the S protein may contribute to the evasion of the host immune response and is a novel feature of SARS-CoV-2.</p>
</sec>
<sec id="sec9" sec-type="materials|methods">
<title>Materials and methods</title>
<sec id="sec10">
<title>Cells and viruses</title>
<p>Primary normal human bronchial epithelial (NHBE) cells from healthy adults and high-risk adults (deidentified) were obtained from Dr. Kristina Bailey at the University of Nebraska Medical Center (UNMC) (Omaha, NE) under an approved material transfer agreement (MTA) between the University of North Dakota (UND) and UNMC (Omaha, NE). The protocol for obtaining cells was reviewed by the UNMC IRB and was determined to not constitute human subject research (#318-09-NH). In this study, we used cells from three donors: nonsmoker healthy adults (donors #1 and #2) and adult with chronic obstructive pulmonary disease (COPD) (donor #3). The protocols for subculturing primary NHBE cells were published previously (<xref ref-type="bibr" rid="ref28">Osan et al., 2020</xref>, <xref ref-type="bibr" rid="ref27">2021</xref>, <xref ref-type="bibr" rid="ref29">2022</xref>; <xref ref-type="bibr" rid="ref43">Talukdar et al., 2022</xref>). Human lung epithelial A549 cells was maintained in F-12 medium (Thermo Fisher Scientific) as described previously (<xref ref-type="bibr" rid="ref23">Mehedi et al., 2016</xref>). SARS-CoV-2 (USA/WA-CDC-WA1/2020 isolate, GenBank accession no. MN985325; kindly provided by CDC), SARS-CoV (Urbani strain, GenBank accession no. AY278741; kindly provided by Rocky Mountain Laboratories (RML), NIAID, NIH), and MERS-CoV (GenBank accession no. NC_019843.3; kindly provided by the Department of Viroscience, Erasmus Medical Center, Rotterdam, The Netherlands) were used for <italic>in vitro</italic> infections described below.</p>
</sec>
<sec id="sec11">
<title><italic>In silico</italic> analysis</title>
<p>We have used open-source web portals for different <italic>in silico</italic> analyses. 1. Constraint-based alignment tool for multiple protein sequences (COBALT)<xref rid="fn0005" ref-type="fn"><sup>1</sup></xref> was used for multiple sequence alignment. 2. PSORT II<xref rid="fn0006" ref-type="fn"><sup>2</sup></xref> was used for NLS prediction. 3. The RPIseq web portal<xref rid="fn0007" ref-type="fn"><sup>3</sup></xref> was used for RNA&#x2013;protein interactions.</p>
</sec>
<sec id="sec12">
<title>Highly differentiated pseudostratified bronchial airway epithelium</title>
<p>The protocols for differentiating primary NHBE cells to form a pseudostratified bronchial airway epithelium were published previously (<xref ref-type="bibr" rid="ref28">Osan et al., 2020</xref>, <xref ref-type="bibr" rid="ref27">2021</xref>, <xref ref-type="bibr" rid="ref29">2022</xref>; <xref ref-type="bibr" rid="ref43">Talukdar et al., 2022</xref>). Briefly, Transwells (6.5&#x2009;mm) with 0.4-&#x03BC;m-pore polyester membrane inserts (Corning Inc.) were coated with PureCol (Advanced BioMatrix) for 20&#x2009;min before cell seeding. NHBE cells (5&#x00D7;10^4) suspended in 100&#x2009;&#x03BC;L of complete airway epithelial cell (cAEC) medium [AEC medium (Promocell)&#x2009;+&#x2009;SupplementMix (Promocell)&#x2009;+&#x2009;1% penicillin&#x2013;streptomycin (V/V) (Thermo Fisher Scientific)&#x2009;+&#x2009;0.5% amphotericin B (V/V) (Thermo Fisher Scientific)] were seeded in the upper chamber of the Transwell. Then, 500&#x2009;&#x03BC;L of cAEC medium was added to the lower chamber of the Transwell. When the cells formed a confluent layer on the Transwell insert, the cAEC medium was removed from the upper chamber, and in the lower chamber, the cAEC medium was replaced with complete ALI medium [PneumaCult-ALI basal medium (Stemcell Technologies Inc.)&#x2009;+&#x2009;with the required supplements (Stemcell Technologies)&#x2009;+&#x2009;2% penicillin&#x2013;streptomycin (V/V)&#x2009;+&#x2009;1% amphotericin B (V/V)]. The complete ALI medium in the lower chamber was changed every day. The upper chamber was washed with 1x Dulbecco&#x2019;s phosphate-buffered saline (DPBS) (Thermo Fisher Scientific) once per week initially but more frequently when more mucus was observed during later days. All cells were differentiated for at least 4 weeks at 37&#x00B0;C in a 5% CO<sub>2</sub> incubator. We observed motile cilia in the differentiated airway epithelium similar to previously described (<xref ref-type="bibr" rid="ref28">Osan et al., 2020</xref>).</p>
</sec>
<sec id="sec13">
<title>Viral infection</title>
<p>All viral infection experiments were conducted in the high biocontainment facility at RML, NIAID, NIH, Hamilton, MT. After approximately 3&#x2009;weeks, the differentiated airway epithelium on Transwells was shipped to RML in an optimized transportation medium (<xref ref-type="bibr" rid="ref28">Osan et al., 2020</xref>, <xref ref-type="bibr" rid="ref29">2022</xref>), and the recovered cells were maintained in complete ALI medium for approximately 1 week before infection. For infection, the airway epithelium on Transwells was washed with 200&#x2009;&#x03BC;L of 1x PBS to remove mucus and were infected on the apical site with SARS-CoV-2, MERS-CoV, or SARS-CoV at a MOI of 0.1 in 100&#x2009;&#x03BC;L 1x PBS for 1&#x2009;h (at 37&#x00B0;C with 5% CO<sub>2</sub>). For mock infection, the Transwells were similarly incubated with 100&#x2009;&#x03BC;L 1x PBS without virus. The viral inoculum was then removed, and the epithelium on the Transwell was washed twice with 200&#x2009;&#x03BC;L of 1x PBS. Complete ALI medium (1,000&#x2009;&#x03BC;L) was added to the lower chamber of each Transwell, and the upper chamber was kept empty. Mock-infected and virus-infected Transwells were incubated for 4&#x2009;days at 37&#x00B0;C in an incubator with 5% CO<sub>2</sub> (<xref ref-type="bibr" rid="ref29">Osan et al., 2022</xref>).</p>
</sec>
<sec id="sec14">
<title>Paraformaldehyde (PFA) fixation and paraffin embedding</title>
<p>At 4&#x2009;days postinfection (DPI), 200&#x2009;&#x03BC;L of 1x PBS was added to the apical site of the Transwell for washing before PFA fixation. In the basal side of the Transwell inserts was 200&#x2009;&#x03BC;L of 1x PBS. For PFA fixation, 200&#x2009;&#x03BC;L of 4% PFA (Polysciences) was added to the upper chamber of the Transwells and incubated for 30&#x2009;min, and the Transwells were further maintained overnight in 4% PFA prior to removal from high biocontainment. The PFA fixation protocol was approved as an inactivation method for coronaviruses by the RML Institutional Biosafety Committee. The PFA-fixed airway epithelium was paraffin-embedded and sectioned at a thickness of 5&#x2009;&#x03BC;m for slide preparation as previously described (<xref ref-type="bibr" rid="ref27">Osan et al., 2021</xref>).</p>
</sec>
<sec id="sec15">
<title>Simultaneous detection of S mRNA and S protein</title>
<p>Slides with 5&#x2009;&#x03BC;m sections were first deparaffinized by incubation in a Coplin jar as follows: 1. Histo-Clear for 5&#x2009;min, two times; 2. 100% ethanol for 5&#x2009;min, three times; 3. 95% ethanol for 5&#x2009;min, 4. 70% ethanol for 5&#x2009;min, and 5. distilled water for 5&#x2009;min. The deparaffinized slides were immediately incubated in 0.5% Triton X-100 in 1x PBS for 30&#x2009;min. The slides were washed three times with 1X PBST (1x PBS with Tween 20) or 1x PBS for 5&#x2009;min. A hydrophobic barrier was drawn around the 5&#x2009;&#x03BC;m section on the slides by using an Immedge Hydrophobic Barrier Pen. To reduce nonspecific antibody binding, the section was blocked with 10% goat serum (Vector Laboratories) in 1x PBST for 2&#x2009;h at 4&#x00B0;C. The slides were then incubated with viral protein-specific primary antibody solution in 1x PBST (e.g., SARS-CoV/SARS-CoV-2&#x2009;S protein-specific rabbit polyclonal antibody at a 1:100 dilution, SARS-CoV/SARS-CoV-2&#x2009;N protein-specific mouse monoclonal antibody at a 1:100 dilution, or MERS-CoV N protein-specific mouse monoclonal antibody at a 1:100 dilution) (<xref ref-type="bibr" rid="ref27">Osan et al., 2021</xref>) overnight at 4&#x00B0;C. The slides were then incubated with the corresponding secondary antibody solution (anti-mouse or anti-rabbit AF488 or AF647, Thermo Fisher Scientific) in 1x PBST for 2&#x2009;h at room temperature. We then stained the nuclei with DAPI reagent (Advanced Cell Diagnostics) or used RNAscope multiplex V2 to detect SARS-CoV-2&#x2009;S mRNA (Probe V-nCoV2019-S) according to the manufacturer&#x2019;s instructions (Advanced Cell Diagnostics). The sections were mounted on Tech-Med microscope slides (Thomas Fisher Scientific) using ProLong-Gold antifade mounting medium (Thermo Fisher Scientific).</p>
</sec>
<sec id="sec16">
<title>Imaging and image analysis</title>
<p>For the immunofluorescence (IFA)-based detection of SARS-CoV-2/ SARS-CoV S and N protein were detected by using S-specific rabbit polyclonal antibody (Thermo Fisher Scientific) and N-specific mouse monoclonal antibody (Thermo Fisher Scientific), respectively. Similarly, MERS-CoV N protein was detected using N-specific mouse monoclonal antibody (Sino Biological). Similarly, calnexin and lamin B1 were detected using calnexin-specific mouse monoclonal antibody (Antibody) and lamin B1 specific mouse monoclonal antibody (Abcam), respectively. The slides were then incubated with the corresponding secondary antibody solution (anti-mouse or anti-rabbit AF488 or AF647, Thermo Fisher Scientific). For primary antibody we used 1:1000 dilution, whereas we used 1:200 dilution for secondary anybody incubation. Rhodamine Phalloidin (Cytoskeleton Inc.) (1:500 dilution) and DAPI (Thermo Fisher Scientific) (1 drop in 1,000&#x2009;&#x03BC;L) were used for staining F-actin and nucleus, respectively. For mounting coverslip on a cover glass, we used ProLong Gold Antifade Msounting medium (Thermo Fisher Scientific). The images were taken under an Olympus FluoView laser scanning confocal microscope (Olympus FV3000) enabled with a 60X objective (Olympus), a Leica Stellaris confocal microscope (Leica Microsystem) using a 63x oil objective or a Leica DMI8 epifluorescence microscope (Leica Microsystem). The images were then deconvolved using Huygen Essential deconvolution software (Scientific Volume Imaging). The surface rendering function of Imaris image processing software (Oxford Instruments) was used. The images were also analyzed for spot-to-spot colocalization by Imaris. Where applicable, images taken under a Leica DMI8 microscope were processed using 3D deconvolution and 3D view modules in LASX software (Leica Microsystem). For figure preparation, Prism version 9 (GraphPad) and Adobe Photoshop (Creative Cloud) software were used.</p>
</sec>
<sec id="sec17">
<title>Transient transfection</title>
<p>NHBE cells (two independent donors #1 and #2) were seeded on 24 well plate in cAEC medium at 37&#x00B0;C in a 5% CO<sub>2</sub> incubator. Cells were then transfected with SARS-COV-2 Spike (S) expressing plasmid (generous gift from Shanna S Leventhal and David M Hawman) (<xref ref-type="bibr" rid="ref20">Leventhal et al., 2021</xref>) (0.5&#x2009;&#x03BC;g) using TransfeX transfection reagent (ATCC) according to the manufacturer instructions. Similarly, A549 cells were seeded on a 24 well plate in F-12 medium at 37&#x00B0;C in a 5% CO<sub>2</sub> incubator. For imaging purpose, a coverslip was previously added onto the well of 24-well plate before seeding cells. The cells were transfected with SARS-COV-2 Spike (S) expressing plasmid (0.5&#x2009;&#x03BC;g) using TransLT-1 transfection reagent (Mirus Bio LLC) according to the manufacturer instructions. For control, eGFP in pCAGGS plasmid (generous gift from Dr. Thomas Hoenen) was transfected similarly. For mock-transfection, cells were treated similarly without any plasmid.</p>
</sec>
<sec id="sec18">
<title>Nuclear and cytoplasmic fractionation and Western blotting</title>
<p>Old medium was removed, and cells were washed at 1x PBS. Both cytoplasmic and nuclear portion from the S-transfected or mock-transfected A549 cells were collected using nuclear fractionating kit according to the manufacturer instructions. Around 30 ul of cytoplasmic and nuclear portions were run 4&#x2013;12% bis-tris gel (Thermo Fisher Scientific) and followed by transferred on polyvinylidene fluoride (PVDF) membrane (Thermo Fisher Scientific) using iblot (Thermo Fisher Scientific). The membrane was blocked using Li-Cor blocking buffer (LI-COR Biosciences). For SARS-CoV-2&#x2009;S protein was detected using SARS-CoV/SARS-CoV-2&#x2009;S protein-specific rabbit polyclonal antibody (Thermo Fisher Scientific) at a 1:2500 dilution. Lamin A and C were detected protein-specific rabbit polyclonal antibody (Abcam) (molecular weight around 75&#x2009;kDa and lower, respectively) at a 1:5000 dilution. Cdc42 were detected protein-specific rabbit polyclonal antibody (Cell Signaling Inc) (molecular weight around 20&#x2009;kDa) at a 1:1000 dilution. A sequential different primary and secondary antibodies (e.g., anti-rabbit goat IRDye 680RD or ant-rabbit goat IRDye 800CW incubation for different protein detection on the same gel. For accuracy of protein detection, individual protein specific gel was also generated.</p>
</sec>
</sec>
<sec id="sec19" sec-type="data-availability">
<title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article/<xref rid="SM1" ref-type="supplementary-material">Supplementary material</xref>, further inquiries can be directed to the corresponding author.</p>
</sec>
<sec id="sec20">
<title>Author contributions</title>
<p>MM conceived the project and designed all the experiments, analyzed (<italic>in silico</italic>) the viral genome and protein sequences, and prepared the figures and wrote and edited the manuscript. KB provided the primary cells. FF performed the viral infection work. KJ, SS, and MM performed all staining for detection. MM and SS generated the microscopic images. JK and MM processed and quantified images. All authors contributed to the article and approved the submitted version.</p>
</sec>
<sec id="sec21" sec-type="funding-information">
<title>Funding</title>
<p>This work was funded by the NIH/NIGMS awards P20GM113123 and T34GM122835, VA grant 101-BX005413 and partially by the Intramural Research Program, NIAID, NIH. The content is solely the responsibility of the authors and does not necessarily represent the official views of the NIH.</p>
</sec>
<sec id="conf1" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="sec100" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
</body>
<back>
<ack>
<p>We are thankful to the MARC U-STAR program at UND for supporting the undergraduate students SS and KJ. We are grateful to Jaspreet K. Osan for helping with primary cell culture work. We are also grateful to Heinz Feldmann of the Laboratory of Virology, NIAID, NIH for support with material and infections. We are thankful to Shanna S. Leventhal and David W. Hawman for sharing S protein expressing recombinant plasmid. In addition, we thank the Microscopy Core (UND, Grand Forks), which is funded by NIH P20GM103442, of the INBRE program for providing access to an Olympus FV300 confocal microscope. Histological services were provided by the UND Histology Core, which is supported by the NIH/NIGMS awards P20GM113123, U54G M128729, and UND SMHS funds. We also thank the Imaging Core (UND, Grand Forks), which is funded by NIH P20GM113123, NIH U54GM128729, and UNDSMHS funds, for IMARIS image analyses.</p>
</ack>
<sec id="sec23" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary material for this article can be found online at: <ext-link xlink:href="https://www.frontiersin.org/articles/10.3389/fmicb.2023.1073789/full#supplementary-material" ext-link-type="uri">https://www.frontiersin.org/articles/10.3389/fmicb.2023.1073789/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Data_Sheet_1.PDF" id="SM1" mimetype="application/pdf" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Data_Sheet_2.PDF" id="SM2" mimetype="application/pdf" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image_1.TIFF" id="SM3" mimetype="image/tiff" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image_2.TIFF" id="SM4" mimetype="image/tiff" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image_3.TIFF" id="SM5" mimetype="image/tiff" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image_4.TIFF" id="SM6" mimetype="image/tiff" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image_5.TIFF" id="SM7" mimetype="image/tiff" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image_6.TIFF" id="SM8" mimetype="image/tiff" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image_7.TIFF" id="SM9" mimetype="image/tiff" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image_8.TIFF" id="SM10" mimetype="image/tiff" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image_9.TIFF" id="SM11" mimetype="image/tiff" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="ref1"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Addetia</surname> <given-names>A.</given-names></name> <name><surname>Lieberman</surname> <given-names>N. A. P.</given-names></name> <name><surname>Phung</surname> <given-names>Q.</given-names></name> <name><surname>Hsiang</surname> <given-names>T. Y.</given-names></name> <name><surname>Xie</surname> <given-names>H.</given-names></name> <name><surname>Roychoudhury</surname> <given-names>P.</given-names></name> <etal/></person-group>. (<year>2021</year>). <article-title>SARS-CoV-2 ORF6 disrupts bidirectional Nucleocytoplasmic transport through interactions with Rae1 and Nup98</article-title>. <source>mBio</source> <volume>12</volume>.</citation></ref>
<ref id="ref2"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Andersen</surname> <given-names>K. G.</given-names></name> <name><surname>Rambaut</surname> <given-names>A.</given-names></name> <name><surname>Lipkin</surname> <given-names>W. I.</given-names></name> <name><surname>Holmes</surname> <given-names>E. C.</given-names></name> <name><surname>Garry</surname> <given-names>R. F.</given-names></name></person-group> (<year>2020</year>). <article-title>The proximal origin of SARS-CoV-2</article-title>. <source>Nat. Med.</source> <volume>26</volume>, <fpage>450</fpage>&#x2013;<lpage>452</lpage>. doi: <pub-id pub-id-type="doi">10.1038/s41591-020-0820-9</pub-id>, PMID: <pub-id pub-id-type="pmid">32284615</pub-id></citation></ref>
<ref id="ref3"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Boisvert</surname> <given-names>M.</given-names></name> <name><surname>Bouchard-Levesque</surname> <given-names>V.</given-names></name> <name><surname>Fernandes</surname> <given-names>S.</given-names></name> <name><surname>Tijssen</surname> <given-names>P.</given-names></name></person-group> (<year>2014</year>). <article-title>Classic nuclear localization signals and a novel nuclear localization motif are required for nuclear transport of porcine parvovirus capsid proteins</article-title>. <source>J. Virol.</source> <volume>88</volume>, <fpage>11748</fpage>&#x2013;<lpage>11759</lpage>. doi: <pub-id pub-id-type="doi">10.1128/JVI.01717-14</pub-id>, PMID: <pub-id pub-id-type="pmid">25078698</pub-id></citation></ref>
<ref id="ref4"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bojkova</surname> <given-names>D.</given-names></name> <name><surname>Klann</surname> <given-names>K.</given-names></name> <name><surname>Koch</surname> <given-names>B.</given-names></name> <name><surname>Widera</surname> <given-names>M.</given-names></name> <name><surname>Krause</surname> <given-names>D.</given-names></name> <name><surname>Ciesek</surname> <given-names>S.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>Proteomics of SARS-CoV-2-infected host cells reveals therapy targets</article-title>. <source>Nature</source> <volume>583</volume>, <fpage>469</fpage>&#x2013;<lpage>472</lpage>. doi: <pub-id pub-id-type="doi">10.1038/s41586-020-2332-7</pub-id>, PMID: <pub-id pub-id-type="pmid">32408336</pub-id></citation></ref>
<ref id="ref5"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chan</surname> <given-names>Y. A.</given-names></name> <name><surname>Zhan</surname> <given-names>S. H.</given-names></name></person-group> (<year>2022</year>). <article-title>The emergence of the spike Furin cleavage site in SARS-CoV-2</article-title>. <source>Mol. Biol. Evol.</source> <volume>39</volume>.</citation></ref>
<ref id="ref6"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Conceicao</surname> <given-names>C.</given-names></name> <name><surname>Thakur</surname> <given-names>N.</given-names></name> <name><surname>Human</surname> <given-names>S.</given-names></name> <name><surname>Kelly</surname> <given-names>J. T.</given-names></name> <name><surname>Logan</surname> <given-names>L.</given-names></name> <name><surname>Bialy</surname> <given-names>D.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>The SARS-CoV-2 spike protein has a broad tropism for mammalian ACE2 proteins</article-title>. <source>PLoS Biol.</source> <volume>18</volume>:<fpage>e3001016</fpage>. doi: <pub-id pub-id-type="doi">10.1371/journal.pbio.3001016</pub-id>, PMID: <pub-id pub-id-type="pmid">33347434</pub-id></citation></ref>
<ref id="ref7"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cubuk</surname> <given-names>J.</given-names></name> <name><surname>Alston</surname> <given-names>J. J.</given-names></name> <name><surname>Incicco</surname> <given-names>J. J.</given-names></name> <name><surname>Singh</surname> <given-names>S.</given-names></name> <name><surname>Stuchell-Brereton</surname> <given-names>M. D.</given-names></name> <name><surname>Ward</surname> <given-names>M. D.</given-names></name> <etal/></person-group>. (<year>2021</year>). <article-title>The SARS-CoV-2 nucleocapsid protein is dynamic, disordered, and phase separates with RNA</article-title>. <source>Nat. Commun.</source> <volume>12</volume>:<fpage>1936</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41467-021-21953-3</pub-id>, PMID: <pub-id pub-id-type="pmid">33782395</pub-id></citation></ref>
<ref id="ref8"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dapoian</surname> <given-names>A. T.</given-names></name> <name><surname>Gomes</surname> <given-names>A. M.</given-names></name> <name><surname>Oliveira</surname> <given-names>R. J. N.</given-names></name> <name><surname>Silva</surname> <given-names>J. L.</given-names></name></person-group> (<year>1996</year>). <article-title>Migration of vesicular stomatitis virus glycoprotein to the nucleus of infected cells</article-title>. <source>Proc. Natl. Acad. Sci. U. S. A.</source> <volume>93</volume>, <fpage>8268</fpage>&#x2013;<lpage>8273</lpage>. doi: <pub-id pub-id-type="doi">10.1073/pnas.93.16.8268</pub-id>, PMID: <pub-id pub-id-type="pmid">8710859</pub-id></citation></ref>
<ref id="ref9"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dinesh</surname> <given-names>D. C.</given-names></name> <name><surname>Chalupska</surname> <given-names>D.</given-names></name> <name><surname>Silhan</surname> <given-names>J.</given-names></name> <name><surname>Koutna</surname> <given-names>E.</given-names></name> <name><surname>Nencka</surname> <given-names>R.</given-names></name> <name><surname>Veverka</surname> <given-names>V.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>Structural basis of RNA recognition by the SARS-CoV-2 nucleocapsid phosphoprotein</article-title>. <source>PLoS Pathog.</source> <volume>16</volume>:<fpage>e1009100</fpage>. doi: <pub-id pub-id-type="doi">10.1371/journal.ppat.1009100</pub-id>, PMID: <pub-id pub-id-type="pmid">33264373</pub-id></citation></ref>
<ref id="ref10"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Finkel</surname> <given-names>Y.</given-names></name> <name><surname>Mizrahi</surname> <given-names>O.</given-names></name> <name><surname>Nachshon</surname> <given-names>A.</given-names></name> <name><surname>Weingarten-Gabbay</surname> <given-names>S.</given-names></name> <name><surname>Morgenstern</surname> <given-names>D.</given-names></name> <name><surname>Yahalom-Ronen</surname> <given-names>Y.</given-names></name> <etal/></person-group>. (<year>2021</year>). <article-title>The coding capacity of SARS-CoV-2</article-title>. <source>Nature</source> <volume>589</volume>, <fpage>125</fpage>&#x2013;<lpage>130</lpage>. doi: <pub-id pub-id-type="doi">10.1038/s41586-020-2739-1</pub-id></citation></ref>
<ref id="ref11"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gibson</surname> <given-names>C. A.</given-names></name> <name><surname>Daniels</surname> <given-names>R. S.</given-names></name> <name><surname>Oxford</surname> <given-names>J. S.</given-names></name> <name><surname>Mccauley</surname> <given-names>J. W.</given-names></name></person-group> (<year>1992</year>). <article-title>Sequence analysis of the equine H7 influenza virus haemagglutinin gene</article-title>. <source>Virus Res.</source> <volume>22</volume>, <fpage>93</fpage>&#x2013;<lpage>106</lpage>. doi: <pub-id pub-id-type="doi">10.1016/0168-1702(92)90037-A</pub-id>, PMID: <pub-id pub-id-type="pmid">1566601</pub-id></citation></ref>
<ref id="ref12"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gussow</surname> <given-names>A. B.</given-names></name> <name><surname>Auslander</surname> <given-names>N.</given-names></name> <name><surname>Faure</surname> <given-names>G.</given-names></name> <name><surname>Wolf</surname> <given-names>Y. I.</given-names></name> <name><surname>Zhang</surname> <given-names>F.</given-names></name> <name><surname>Koonin</surname> <given-names>E. V.</given-names></name></person-group> (<year>2020</year>). <article-title>Genomic determinants of pathogenicity in SARS-CoV-2 and other human coronaviruses</article-title>. <source>Proc. Natl. Acad. Sci. U. S. A.</source> <volume>117</volume>, <fpage>15193</fpage>&#x2013;<lpage>15199</lpage>. doi: <pub-id pub-id-type="doi">10.1073/pnas.2008176117</pub-id>, PMID: <pub-id pub-id-type="pmid">32522874</pub-id></citation></ref>
<ref id="ref13"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Harrow</surname> <given-names>J.</given-names></name> <name><surname>Nagy</surname> <given-names>A.</given-names></name> <name><surname>Reymond</surname> <given-names>A.</given-names></name> <name><surname>Alioto</surname> <given-names>T.</given-names></name> <name><surname>Patthy</surname> <given-names>L.</given-names></name> <name><surname>Antonarakis</surname> <given-names>S. E.</given-names></name> <etal/></person-group>. (<year>2009</year>). <article-title>Identifying protein-coding genes in genomic sequences</article-title>. <source>Genome Biol.</source> <volume>10</volume>:<fpage>201</fpage>. doi: <pub-id pub-id-type="doi">10.1186/gb-2009-10-1-201</pub-id>, PMID: <pub-id pub-id-type="pmid">19226436</pub-id></citation></ref>
<ref id="ref14"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hicks</surname> <given-names>G. R.</given-names></name> <name><surname>Raikhel</surname> <given-names>N. V.</given-names></name></person-group> (<year>1995</year>). <article-title>Protein import into the nucleus: an integrated view</article-title>. <source>Annu. Rev. Cell Dev. Biol.</source> <volume>11</volume>, <fpage>155</fpage>&#x2013;<lpage>188</lpage>. doi: <pub-id pub-id-type="doi">10.1146/annurev.cb.11.110195.001103</pub-id>, PMID: <pub-id pub-id-type="pmid">8689555</pub-id></citation></ref>
<ref id="ref15"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hoffmann</surname> <given-names>M.</given-names></name> <name><surname>Kleine-Weber</surname> <given-names>H.</given-names></name> <name><surname>Schroeder</surname> <given-names>S.</given-names></name> <name><surname>Kruger</surname> <given-names>N.</given-names></name> <name><surname>Herrler</surname> <given-names>T.</given-names></name> <name><surname>Erichsen</surname> <given-names>S.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>SARS-CoV-2 cell entry depends on ACE2 and TMPRSS2 and is blocked by a clinically proven protease inhibitor</article-title>. <source>Cells</source> <volume>181</volume>:<fpage>e278</fpage>, <fpage>271</fpage>&#x2013;<lpage>280.e8</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.cell.2020.02.052</pub-id></citation></ref>
<ref id="ref16"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hu</surname> <given-names>T.</given-names></name> <name><surname>Liu</surname> <given-names>Y.</given-names></name> <name><surname>Zhao</surname> <given-names>M.</given-names></name> <name><surname>Zhuang</surname> <given-names>Q.</given-names></name> <name><surname>Xu</surname> <given-names>L.</given-names></name> <name><surname>He</surname> <given-names>Q.</given-names></name></person-group> (<year>2020</year>). <article-title>A comparison of COVID-19 SARS and MERS</article-title>. <source>PeerJ</source> <volume>8</volume>:<fpage>e9725</fpage>. doi: <pub-id pub-id-type="doi">10.7717/peerj.9725</pub-id>, PMID: <pub-id pub-id-type="pmid">32879801</pub-id></citation></ref>
<ref id="ref17"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jia</surname> <given-names>H. P.</given-names></name> <name><surname>Look</surname> <given-names>D. C.</given-names></name> <name><surname>Shi</surname> <given-names>L.</given-names></name> <name><surname>Hickey</surname> <given-names>M.</given-names></name> <name><surname>Pewe</surname> <given-names>L.</given-names></name> <name><surname>Netland</surname> <given-names>J.</given-names></name> <etal/></person-group>. (<year>2005</year>). <article-title>ACE2 receptor expression and severe acute respiratory syndrome coronavirus infection depend on differentiation of human airway epithelia</article-title>. <source>J. Virol.</source> <volume>79</volume>, <fpage>14614</fpage>&#x2013;<lpage>14621</lpage>. doi: <pub-id pub-id-type="doi">10.1128/JVI.79.23.14614-14621.2005</pub-id>, PMID: <pub-id pub-id-type="pmid">16282461</pub-id></citation></ref>
<ref id="ref18"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Klimstra</surname> <given-names>W. B.</given-names></name> <name><surname>Heidner</surname> <given-names>H. W.</given-names></name> <name><surname>Johnston</surname> <given-names>R. E.</given-names></name></person-group> (<year>1999</year>). <article-title>The furin protease cleavage recognition sequence of Sindbis virus PE2 can mediate virion attachment to cell surface heparan sulfate</article-title>. <source>J. Virol.</source> <volume>73</volume>, <fpage>6299</fpage>&#x2013;<lpage>6306</lpage>. doi: <pub-id pub-id-type="doi">10.1128/JVI.73.8.6299-6306.1999</pub-id>, PMID: <pub-id pub-id-type="pmid">10400721</pub-id></citation></ref>
<ref id="ref19"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Krysan</surname> <given-names>D. J.</given-names></name> <name><surname>Rockwell</surname> <given-names>N. C.</given-names></name> <name><surname>Fuller</surname> <given-names>R. S.</given-names></name></person-group> (<year>1999</year>). <article-title>Quantitative characterization of furin specificity. Energetics of substrate discrimination using an internally consistent set of hexapeptidyl methylcoumarinamides</article-title>. <source>J. Biol. Chem.</source> <volume>274</volume>, <fpage>23229</fpage>&#x2013;<lpage>23234</lpage>. doi: <pub-id pub-id-type="doi">10.1074/jbc.274.33.23229</pub-id>, PMID: <pub-id pub-id-type="pmid">10438496</pub-id></citation></ref>
<ref id="ref20"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Leventhal</surname> <given-names>S. S.</given-names></name> <name><surname>Clancy</surname> <given-names>C.</given-names></name> <name><surname>Erasmus</surname> <given-names>J.</given-names></name> <name><surname>Feldmann</surname> <given-names>H.</given-names></name> <name><surname>Hawman</surname> <given-names>D. W.</given-names></name></person-group> (<year>2021</year>). <article-title>An intramuscular DNA vaccine for SARS-CoV-2 decreases viral lung load but not lung pathology in Syrian hamsters</article-title>. <source>Microorganisms</source> <volume>9</volume>:<fpage>1040</fpage>. doi: <pub-id pub-id-type="doi">10.3390/microorganisms9051040</pub-id>, PMID: <pub-id pub-id-type="pmid">34065996</pub-id></citation></ref>
<ref id="ref21"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Liu</surname> <given-names>J.</given-names></name> <name><surname>Xie</surname> <given-names>W.</given-names></name> <name><surname>Wang</surname> <given-names>Y.</given-names></name> <name><surname>Xiong</surname> <given-names>Y.</given-names></name> <name><surname>Chen</surname> <given-names>S.</given-names></name> <name><surname>Han</surname> <given-names>J.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>A comparative overview of COVID-19, MERS and SARS: review article</article-title>. <source>Int. J. Surg.</source> <volume>81</volume>, <fpage>1</fpage>&#x2013;<lpage>8</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.ijsu.2020.07.032</pub-id>, PMID: <pub-id pub-id-type="pmid">32730205</pub-id></citation></ref>
<ref id="ref22"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Martinez-Flores</surname> <given-names>D.</given-names></name> <name><surname>Zepeda-Cervantes</surname> <given-names>J.</given-names></name> <name><surname>Cruz-Resendiz</surname> <given-names>A.</given-names></name> <name><surname>Aguirre-Sampieri</surname> <given-names>S.</given-names></name> <name><surname>Sampieri</surname> <given-names>A.</given-names></name> <name><surname>Vaca</surname> <given-names>L.</given-names></name></person-group> (<year>2021</year>). <article-title>SARS-CoV-2 vaccines based on the spike glycoprotein and implications of new viral variants</article-title>. <source>Front. Immunol.</source> <volume>12</volume>:<fpage>701501</fpage>. doi: <pub-id pub-id-type="doi">10.3389/fimmu.2021.701501</pub-id>, PMID: <pub-id pub-id-type="pmid">34322129</pub-id></citation></ref>
<ref id="ref23"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mehedi</surname> <given-names>M.</given-names></name> <name><surname>Mccarty</surname> <given-names>T.</given-names></name> <name><surname>Martin</surname> <given-names>S. E.</given-names></name> <name><surname>Le Nouen</surname> <given-names>C.</given-names></name> <name><surname>Buehler</surname> <given-names>E.</given-names></name> <name><surname>Chen</surname> <given-names>Y. C.</given-names></name> <etal/></person-group>. (<year>2016</year>). <article-title>Actin-related protein 2 (ARP2) and virus-induced Filopodia facilitate Human respiratory syncytial virus spread</article-title>. <source>PLoS Pathog.</source> <volume>12</volume>:<fpage>e1006062</fpage>. doi: <pub-id pub-id-type="doi">10.1371/journal.ppat.1006062</pub-id>, PMID: <pub-id pub-id-type="pmid">27926942</pub-id></citation></ref>
<ref id="ref24"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Muppirala</surname> <given-names>U. K.</given-names></name> <name><surname>Honavar</surname> <given-names>V. G.</given-names></name> <name><surname>Dobbs</surname> <given-names>D.</given-names></name></person-group> (<year>2011</year>). <article-title>Predicting RNA-protein interactions using only sequence information</article-title>. <source>BMC Bioinform.</source> <volume>12</volume>:<fpage>489</fpage>. doi: <pub-id pub-id-type="doi">10.1186/1471-2105-12-489</pub-id>, PMID: <pub-id pub-id-type="pmid">22192482</pub-id></citation></ref>
<ref id="ref25"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Nakai</surname> <given-names>K.</given-names></name> <name><surname>Horton</surname> <given-names>P.</given-names></name></person-group> (<year>1999</year>). <article-title>PSORT: a program for detecting sorting signals in proteins and predicting their subcellular localization</article-title>. <source>Trends Biochem. Sci.</source> <volume>24</volume>, <fpage>34</fpage>&#x2013;<lpage>35</lpage>. doi: <pub-id pub-id-type="doi">10.1016/S0968-0004(98)01336-X</pub-id>, PMID: <pub-id pub-id-type="pmid">10087920</pub-id></citation></ref>
<ref id="ref26"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ord</surname> <given-names>M.</given-names></name> <name><surname>Faustova</surname> <given-names>I.</given-names></name> <name><surname>Loog</surname> <given-names>M.</given-names></name></person-group> (<year>2020</year>). <article-title>The sequence at spike S1/S2 site enables cleavage by furin and phospho-regulation in SARS-CoV2 but not in SARS-CoV1 or MERS-CoV</article-title>. <source>Sci. Rep.</source> <volume>10</volume>:<fpage>16944</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41598-020-74101-0</pub-id>, PMID: <pub-id pub-id-type="pmid">33037310</pub-id></citation></ref>
<ref id="ref27"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Osan</surname> <given-names>J. K.</given-names></name> <name><surname>Demontigny</surname> <given-names>B. A.</given-names></name> <name><surname>Mehedi</surname> <given-names>M.</given-names></name></person-group> (<year>2021</year>). <article-title>Immunohistochemistry for protein detection in PFA-fixed paraffin-embedded SARS-CoV-2-infected COPD airway epithelium</article-title>. <source>STAR Protoc.</source> <volume>2</volume>:<fpage>100663</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.xpro.2021.100663</pub-id>, PMID: <pub-id pub-id-type="pmid">34250510</pub-id></citation></ref>
<ref id="ref28"><citation citation-type="other"><person-group person-group-type="author"><name><surname>Osan</surname> <given-names>J. K.</given-names></name> <name><surname>Talukdar</surname> <given-names>S. N.</given-names></name> <name><surname>Feldmann</surname> <given-names>F.</given-names></name> <name><surname>Ann Demontigny</surname> <given-names>B.</given-names></name> <name><surname>Jerome</surname> <given-names>K.</given-names></name> <name><surname>Bailey</surname> <given-names>K. L.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>Goblet cell hyperplasia increases SARS-CoV-2 infection in COPD. bioRxiv</article-title>.</citation></ref>
<ref id="ref29"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Osan</surname> <given-names>J.</given-names></name> <name><surname>Talukdar</surname> <given-names>S. N.</given-names></name> <name><surname>Feldmann</surname> <given-names>F.</given-names></name> <name><surname>Demontigny</surname> <given-names>B. A.</given-names></name> <name><surname>Jerome</surname> <given-names>K.</given-names></name> <name><surname>Bailey</surname> <given-names>K. L.</given-names></name> <etal/></person-group>. (<year>2022</year>). <article-title>Goblet cell hyperplasia increases SARS-CoV-2 infection in chronic obstructive pulmonary disease</article-title>. <source>Microbiol. Spectr.</source> <volume>10</volume>. doi: <pub-id pub-id-type="doi">10.1128/spectrum.00459-22</pub-id></citation></ref>
<ref id="ref30"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ozawa</surname> <given-names>M.</given-names></name> <name><surname>Fujii</surname> <given-names>K.</given-names></name> <name><surname>Muramoto</surname> <given-names>Y.</given-names></name> <name><surname>Yamada</surname> <given-names>S.</given-names></name> <name><surname>Yamayoshi</surname> <given-names>S.</given-names></name> <name><surname>Takada</surname> <given-names>A.</given-names></name> <etal/></person-group>. (<year>2007</year>). <article-title>Contributions of two nuclear localization signals of influenza a virus nucleoprotein to viral replication</article-title>. <source>J. Virol.</source> <volume>81</volume>, <fpage>30</fpage>&#x2013;<lpage>41</lpage>. doi: <pub-id pub-id-type="doi">10.1128/JVI.01434-06</pub-id>, PMID: <pub-id pub-id-type="pmid">17050598</pub-id></citation></ref>
<ref id="ref31"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Papadopoulos</surname> <given-names>J. S.</given-names></name> <name><surname>Agarwala</surname> <given-names>R.</given-names></name></person-group> (<year>2007</year>). <article-title>COBALT: constraint-based alignment tool for multiple protein sequences</article-title>. <source>Bioinformatics</source> <volume>23</volume>, <fpage>1073</fpage>&#x2013;<lpage>1079</lpage>. doi: <pub-id pub-id-type="doi">10.1093/bioinformatics/btm076</pub-id>, PMID: <pub-id pub-id-type="pmid">17332019</pub-id></citation></ref>
<ref id="ref32"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Parent</surname> <given-names>L. J.</given-names></name></person-group> (<year>2011</year>). <article-title>New insights into the nuclear localization of retroviral gag proteins</article-title>. <source>Nucleus</source> <volume>2</volume>, <fpage>92</fpage>&#x2013;<lpage>97</lpage>. doi: <pub-id pub-id-type="doi">10.4161/nucl.2.2.15018</pub-id>, PMID: <pub-id pub-id-type="pmid">21738831</pub-id></citation></ref>
<ref id="ref33"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pasternak</surname> <given-names>A. O.</given-names></name> <name><surname>Spaan</surname> <given-names>W. J. M.</given-names></name> <name><surname>Snijder</surname> <given-names>E. J.</given-names></name></person-group> (<year>2006</year>). <article-title>Nidovirus transcription: how to make sense..?</article-title> <source>J. Gen. Virol.</source> <volume>87</volume>, <fpage>1403</fpage>&#x2013;<lpage>1421</lpage>. doi: <pub-id pub-id-type="doi">10.1099/vir.0.81611-0</pub-id></citation></ref>
<ref id="ref34"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Peacock</surname> <given-names>T. P.</given-names></name> <name><surname>Goldhill</surname> <given-names>D. H.</given-names></name> <name><surname>Zhou</surname> <given-names>J.</given-names></name> <name><surname>Baillon</surname> <given-names>L.</given-names></name> <name><surname>Frise</surname> <given-names>R.</given-names></name> <name><surname>Swann</surname> <given-names>O. C.</given-names></name> <etal/></person-group>. (<year>2021</year>). <article-title>The furin cleavage site in the SARS-CoV-2 spike protein is required for transmission in ferrets</article-title>. <source>Nat. Microbiol.</source> <volume>6</volume>, <fpage>899</fpage>&#x2013;<lpage>909</lpage>. doi: <pub-id pub-id-type="doi">10.1038/s41564-021-00908-w</pub-id>, PMID: <pub-id pub-id-type="pmid">33907312</pub-id></citation></ref>
<ref id="ref35"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Perlman</surname> <given-names>S.</given-names></name> <name><surname>Netland</surname> <given-names>J.</given-names></name></person-group> (<year>2009</year>). <article-title>Coronaviruses post-SARS: update on replication and pathogenesis</article-title>. <source>Nat. Rev. Microbiol.</source> <volume>7</volume>, <fpage>439</fpage>&#x2013;<lpage>450</lpage>. doi: <pub-id pub-id-type="doi">10.1038/nrmicro2147</pub-id>, PMID: <pub-id pub-id-type="pmid">19430490</pub-id></citation></ref>
<ref id="ref36"><citation citation-type="other"><person-group person-group-type="author"><name><surname>Pradhan</surname> <given-names>P.</given-names></name> <name><surname>Pandey</surname> <given-names>A. K.</given-names></name> <name><surname>Mishra</surname> <given-names>A.</given-names></name> <name><surname>Gupta</surname> <given-names>P.</given-names></name> <name><surname>Tripathi</surname> <given-names>P. K.</given-names></name> <name><surname>Menon</surname> <given-names>M. B.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>Uncanny similarity of unique inserts in the 2019-nCoV spike protein to HIV-1 gp120 and gag</article-title>. <comment>BioRxiv</comment>.</citation></ref>
<ref id="ref37"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Raj</surname> <given-names>V. S.</given-names></name> <name><surname>Mou</surname> <given-names>H.</given-names></name> <name><surname>Smits</surname> <given-names>S. L.</given-names></name> <name><surname>Dekkers</surname> <given-names>D. H.</given-names></name> <name><surname>Muller</surname> <given-names>M. A.</given-names></name> <name><surname>Dijkman</surname> <given-names>R.</given-names></name> <etal/></person-group>. (<year>2013</year>). <article-title>Dipeptidyl peptidase 4 is a functional receptor for the emerging human coronavirus-EMC</article-title>. <source>Nature</source> <volume>495</volume>, <fpage>251</fpage>&#x2013;<lpage>254</lpage>. doi: <pub-id pub-id-type="doi">10.1038/nature12005</pub-id>, PMID: <pub-id pub-id-type="pmid">23486063</pub-id></citation></ref>
<ref id="ref38"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Robbins</surname> <given-names>J.</given-names></name> <name><surname>Dilwortht</surname> <given-names>S. M.</given-names></name> <name><surname>Laskey</surname> <given-names>R. A.</given-names></name> <name><surname>Dingwall</surname> <given-names>C.</given-names></name></person-group> (<year>1991</year>). <article-title>Two interdependent basic domains in nucleoplasmin nuclear targeting sequence: identification of a class of bipartite nuclear targeting sequence</article-title>. <source>Cells</source> <volume>64</volume>, <fpage>615</fpage>&#x2013;<lpage>623</lpage>. doi: <pub-id pub-id-type="doi">10.1016/0092-8674(91)90245-T</pub-id>, PMID: <pub-id pub-id-type="pmid">1991323</pub-id></citation></ref>
<ref id="ref39"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rowland</surname> <given-names>R. R.</given-names></name> <name><surname>Chauhan</surname> <given-names>V.</given-names></name> <name><surname>Fang</surname> <given-names>Y.</given-names></name> <name><surname>Pekosz</surname> <given-names>A.</given-names></name> <name><surname>Kerrigan</surname> <given-names>M.</given-names></name> <name><surname>Burton</surname> <given-names>M. D.</given-names></name></person-group> (<year>2005</year>). <article-title>Intracellular localization of the severe acute respiratory syndrome coronavirus nucleocapsid protein: absence of nucleolar accumulation during infection and after expression as a recombinant protein in vero cells</article-title>. <source>J. Virol.</source> <volume>79</volume>, <fpage>11507</fpage>&#x2013;<lpage>11512</lpage>. doi: <pub-id pub-id-type="doi">10.1128/JVI.79.17.11507-11512.2005</pub-id>, PMID: <pub-id pub-id-type="pmid">16103202</pub-id></citation></ref>
<ref id="ref40"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Schmidt</surname> <given-names>N.</given-names></name> <name><surname>Lareau</surname> <given-names>C. A.</given-names></name> <name><surname>Keshishian</surname> <given-names>H.</given-names></name> <name><surname>Ganskih</surname> <given-names>S.</given-names></name> <name><surname>Schneider</surname> <given-names>C.</given-names></name> <name><surname>Hennig</surname> <given-names>T.</given-names></name> <etal/></person-group>. (<year>2021</year>). <article-title>The SARS-CoV-2 RNA-protein interactome in infected human cells</article-title>. <source>Nat. Microbiol.</source> <volume>6</volume>, <fpage>339</fpage>&#x2013;<lpage>353</lpage>. doi: <pub-id pub-id-type="doi">10.1038/s41564-020-00846-z</pub-id>, PMID: <pub-id pub-id-type="pmid">33349665</pub-id></citation></ref>
<ref id="ref41"><citation citation-type="other"><person-group person-group-type="author"><name><surname>Smits</surname> <given-names>N.</given-names></name> <name><surname>Rasmussen</surname> <given-names>J.</given-names></name> <name><surname>Bodea</surname> <given-names>G.O.</given-names></name> <name><surname>Amarilla</surname> <given-names>A. A.</given-names></name> <name><surname>Gerdes</surname> <given-names>P.</given-names></name> <name><surname>Sanchez-Luque</surname> <given-names>F. J.</given-names></name> <etal/></person-group>. (<year>2021</year>). <article-title>Human genome integration of SARS-CoV-2 contradicted by long-read sequencing. bioRxiv</article-title>.</citation></ref>
<ref id="ref42"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sola</surname> <given-names>I.</given-names></name> <name><surname>Almazan</surname> <given-names>F.</given-names></name> <name><surname>Zuniga</surname> <given-names>S.</given-names></name> <name><surname>Enjuanes</surname> <given-names>L.</given-names></name></person-group> (<year>2015</year>). <article-title>Continuous and discontinuous RNA synthesis in coronaviruses</article-title>. <source>Annu. Rev. Virol.</source> <volume>2</volume>, <fpage>265</fpage>&#x2013;<lpage>288</lpage>. doi: <pub-id pub-id-type="doi">10.1146/annurev-virology-100114-055218</pub-id>, PMID: <pub-id pub-id-type="pmid">26958916</pub-id></citation></ref>
<ref id="ref43"><citation citation-type="other"><person-group person-group-type="author"><name><surname>Talukdar</surname> <given-names>S. N.</given-names></name> <name><surname>Osan</surname> <given-names>J.</given-names></name> <name><surname>Ryan</surname> <given-names>K.</given-names></name> <name><surname>Grove</surname> <given-names>B.</given-names></name> <name><surname>Perley</surname> <given-names>D.</given-names></name> <name><surname>Kumar</surname> <given-names>B. D.</given-names></name> <etal/></person-group>. (<year>2022</year>). <article-title>RSV-induced expanded ciliated cells contribute to Bronchial Wall thickening</article-title> <comment>bioRxiv</comment>.</citation></ref>
<ref id="ref44"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tian</surname> <given-names>S.</given-names></name> <name><surname>Huang</surname> <given-names>Q.</given-names></name> <name><surname>Fang</surname> <given-names>Y.</given-names></name> <name><surname>Wu</surname> <given-names>J.</given-names></name></person-group> (<year>2011</year>). <article-title>FurinDB: a database of 20-residue furin cleavage site motifs, substrates and their associated drugs</article-title>. <source>Int. J. Mol. Sci.</source> <volume>12</volume>, <fpage>1060</fpage>&#x2013;<lpage>1065</lpage>. doi: <pub-id pub-id-type="doi">10.3390/ijms12021060</pub-id>, PMID: <pub-id pub-id-type="pmid">21541042</pub-id></citation></ref>
<ref id="ref45"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Timani</surname> <given-names>K. A.</given-names></name> <name><surname>Liao</surname> <given-names>Q.</given-names></name> <name><surname>Ye</surname> <given-names>L.</given-names></name> <name><surname>Zeng</surname> <given-names>Y.</given-names></name> <name><surname>Liu</surname> <given-names>J.</given-names></name> <name><surname>Zheng</surname> <given-names>Y.</given-names></name> <etal/></person-group>. (<year>2005</year>). <article-title>Nuclear/nucleolar localization properties of C-terminal nucleocapsid protein of SARS coronavirus</article-title>. <source>Virus Res.</source> <volume>114</volume>, <fpage>23</fpage>&#x2013;<lpage>34</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.virusres.2005.05.007</pub-id>, PMID: <pub-id pub-id-type="pmid">15992957</pub-id></citation></ref>
<ref id="ref46"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Vargas</surname> <given-names>D. Y.</given-names></name> <name><surname>Raj</surname> <given-names>A.</given-names></name> <name><surname>Marras</surname> <given-names>S. A.</given-names></name> <name><surname>Kramer</surname> <given-names>F. R.</given-names></name> <name><surname>Tyagi</surname> <given-names>S.</given-names></name></person-group> (<year>2005</year>). <article-title>Mechanism of mRNA transport in the nucleus</article-title>. <source>Proc. Natl. Acad. Sci. U. S. A.</source> <volume>102</volume>, <fpage>17008</fpage>&#x2013;<lpage>17013</lpage>. doi: <pub-id pub-id-type="doi">10.1073/pnas.0505580102</pub-id>, PMID: <pub-id pub-id-type="pmid">16284251</pub-id></citation></ref>
<ref id="ref47"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Walls</surname> <given-names>A. C.</given-names></name> <name><surname>Park</surname> <given-names>Y. J.</given-names></name> <name><surname>Tortorici</surname> <given-names>M. A.</given-names></name> <name><surname>Wall</surname> <given-names>A.</given-names></name> <name><surname>Mcguire</surname> <given-names>A. T.</given-names></name> <name><surname>Veesler</surname> <given-names>D.</given-names></name></person-group> (<year>2020</year>). <article-title>Structure, function, and antigenicity of the SARS-CoV-2 spike glycoprotein</article-title>. <source>Cells</source> <volume>183</volume>:<fpage>1735</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.cell.2020.11.032</pub-id>, PMID: <pub-id pub-id-type="pmid">33306958</pub-id></citation></ref>
<ref id="ref48"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Whittaker</surname> <given-names>G. R.</given-names></name> <name><surname>Helenius</surname> <given-names>A.</given-names></name></person-group> (<year>1998</year>). <article-title>Nuclear import and export of viruses and virus genomes</article-title>. <source>Virology</source> <volume>246</volume>, <fpage>1</fpage>&#x2013;<lpage>23</lpage>. doi: <pub-id pub-id-type="doi">10.1006/viro.1998.9165</pub-id></citation></ref>
<ref id="ref49"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wu</surname> <given-names>K. E.</given-names></name> <name><surname>Fazal</surname> <given-names>F. M.</given-names></name> <name><surname>Parker</surname> <given-names>K. R.</given-names></name> <name><surname>Zou</surname> <given-names>J.</given-names></name> <name><surname>Chang</surname> <given-names>H. Y.</given-names></name></person-group> (<year>2020</year>). <article-title>RNA-GPS predicts SARS-CoV-2 RNA residency to host mitochondria and nucleolus</article-title>. <source>Cell Syst.</source> <volume>11</volume>:<fpage>e103</fpage>, <fpage>102</fpage>&#x2013;<lpage>108.e3</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.cels.2020.06.008</pub-id></citation></ref>
<ref id="ref50"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Xie</surname> <given-names>Y.</given-names></name> <name><surname>Karki</surname> <given-names>C. B.</given-names></name> <name><surname>Du</surname> <given-names>D.</given-names></name> <name><surname>Li</surname> <given-names>H.</given-names></name> <name><surname>Wang</surname> <given-names>J.</given-names></name> <name><surname>Sobitan</surname> <given-names>A.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>Spike proteins of SARS-CoV and SARS-CoV-2 utilize different mechanisms to bind with Human ACE2</article-title>. <source>Front. Mol. Biosci.</source> <volume>7</volume>:<fpage>591873</fpage>. doi: <pub-id pub-id-type="doi">10.3389/fmolb.2020.591873</pub-id>, PMID: <pub-id pub-id-type="pmid">33363207</pub-id></citation></ref>
<ref id="ref51"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yang</surname> <given-names>Y.</given-names></name> <name><surname>Zhang</surname> <given-names>L.</given-names></name> <name><surname>Geng</surname> <given-names>H.</given-names></name> <name><surname>Deng</surname> <given-names>Y.</given-names></name> <name><surname>Huang</surname> <given-names>B.</given-names></name> <name><surname>Guo</surname> <given-names>Y.</given-names></name> <etal/></person-group>. (<year>2013</year>). <article-title>The structural and accessory proteins M, ORF 4a, ORF 4b, and ORF 5 of Middle East respiratory syndrome coronavirus (MERS-CoV) are potent interferon antagonists</article-title>. <source>Protein Cell</source> <volume>4</volume>, <fpage>951</fpage>&#x2013;<lpage>961</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s13238-013-3096-8</pub-id>, PMID: <pub-id pub-id-type="pmid">24318862</pub-id></citation></ref>
<ref id="ref52"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname> <given-names>J.</given-names></name> <name><surname>Cruz-Cosme</surname> <given-names>R.</given-names></name> <name><surname>Zhuang</surname> <given-names>M. W.</given-names></name> <name><surname>Liu</surname> <given-names>D.</given-names></name> <name><surname>Liu</surname> <given-names>Y.</given-names></name> <name><surname>Teng</surname> <given-names>S.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>A systemic and molecular study of subcellular localization of SARS-CoV-2 proteins</article-title>. <source>Signal Transduct. Target. Ther.</source> <volume>5</volume>:<fpage>269</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41392-020-00372-8</pub-id>, PMID: <pub-id pub-id-type="pmid">33203855</pub-id></citation></ref>
<ref id="ref53"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname> <given-names>L.</given-names></name> <name><surname>Richards</surname> <given-names>A.</given-names></name> <name><surname>Barrasa</surname> <given-names>M. I.</given-names></name> <name><surname>Hughes</surname> <given-names>S. H.</given-names></name> <name><surname>Young</surname> <given-names>R. A.</given-names></name> <name><surname>Jaenisch</surname> <given-names>R.</given-names></name></person-group> (<year>2021</year>). <article-title>Reverse-transcribed SARS-CoV-2 RNA can integrate into the genome of cultured human cells and can be expressed in patient-derived tissues</article-title>. <source>Proc. Natl. Acad. Sci. U. S. A.</source> <volume>118</volume>. doi: <pub-id pub-id-type="doi">10.1073/pnas.2105968118</pub-id></citation></ref>
<ref id="ref54"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname> <given-names>C.</given-names></name> <name><surname>Zheng</surname> <given-names>W.</given-names></name> <name><surname>Huang</surname> <given-names>X.</given-names></name> <name><surname>Bell</surname> <given-names>E. W.</given-names></name> <name><surname>Zhou</surname> <given-names>X.</given-names></name> <name><surname>Zhang</surname> <given-names>Y.</given-names></name></person-group> (<year>2020</year>). <article-title>Protein structure and sequence reanalysis of 2019-nCoV genome refutes snakes as its intermediate host and the unique similarity between its spike protein insertions and HIV-1</article-title>. <source>J. Proteome Res.</source> <volume>19</volume>, <fpage>1351</fpage>&#x2013;<lpage>1360</lpage>. doi: <pub-id pub-id-type="doi">10.1021/acs.jproteome.0c00129</pub-id>, PMID: <pub-id pub-id-type="pmid">32200634</pub-id></citation></ref></ref-list>
<fn-group>
<fn id="fn0005"><p><sup>1</sup><ext-link xlink:href="https://www.ncbi.nlm.nih.gov/tools/cobalt/re_cobalt.cgi" ext-link-type="uri">https://www.ncbi.nlm.nih.gov/tools/cobalt/re_cobalt.cgi</ext-link></p></fn>
<fn id="fn0006"><p><sup>2</sup><ext-link xlink:href="https://psort.hgc.jp/form2.html" ext-link-type="uri">https://psort.hgc.jp/form2.html</ext-link></p></fn>
<fn id="fn0007"><p><sup>3</sup><ext-link xlink:href="http://pridb.gdcb.iastate.edu/RPISeq/" ext-link-type="uri">http://pridb.gdcb.iastate.edu/RPISeq/</ext-link></p></fn>
</fn-group>
</back>
</article>