<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Archiving and Interchange DTD v2.3 20070202//EN" "archivearticle.dtd">
<?covid-19-tdm?>
<article xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="methods-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Med.</journal-id>
<journal-title>Frontiers in Medicine</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Med.</abbrev-journal-title>
<issn pub-type="epub">2296-858X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fmed.2021.790662</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Medicine</subject>
<subj-group>
<subject>Methods</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>CalmBelt: Rapid SARS-CoV-2 Genome Characterization for Outbreak Tracking</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name><surname>Yingtaweesittikul</surname> <given-names>Hatairat</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="author-notes" rid="fn002"><sup>&#x02020;</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Ko</surname> <given-names>Karrie</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
<xref ref-type="aff" rid="aff6"><sup>6</sup></xref>
<xref ref-type="aff" rid="aff7"><sup>7</sup></xref>
<xref ref-type="author-notes" rid="fn002"><sup>&#x02020;</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Abdul Rahman</surname> <given-names>Nurdyana</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<xref ref-type="aff" rid="aff6"><sup>6</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Tan</surname> <given-names>Shireen Yan Ling</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<xref ref-type="aff" rid="aff6"><sup>6</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Nagarajan</surname> <given-names>Niranjan</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="aff" rid="aff7"><sup>7</sup></xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Suphavilai</surname> <given-names>Chayaporn</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x0002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1505252/overview"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>Advanced Research Center for Computational Simulation, Faculty of Science, Chiang Mai University</institution>, <addr-line>Chiang Mai</addr-line>, <country>Thailand</country></aff>
<aff id="aff2"><sup>2</sup><institution>Department of Mathematics, Faculty of Science, Chiang Mai University</institution>, <addr-line>Chiang Mai</addr-line>, <country>Thailand</country></aff>
<aff id="aff3"><sup>3</sup><institution>Genome Institute of Singapore, A&#x0002A;STAR</institution>, <addr-line>Singapore</addr-line>, <country>Singapore</country></aff>
<aff id="aff4"><sup>4</sup><institution>Department of Microbiology, Singapore General Hospital</institution>, <addr-line>Singapore</addr-line>, <country>Singapore</country></aff>
<aff id="aff5"><sup>5</sup><institution>Department of Molecular Pathology, Singapore General Hospital</institution>, <addr-line>Singapore</addr-line>, <country>Singapore</country></aff>
<aff id="aff6"><sup>6</sup><institution>Duke-NUS Medical School</institution>, <addr-line>Singapore</addr-line>, <country>Singapore</country></aff>
<aff id="aff7"><sup>7</sup><institution>Yong Loo Lin School of Medicine, National University of Singapore</institution>, <addr-line>Singapore</addr-line>, <country>Singapore</country></aff>
<author-notes>
<fn fn-type="edited-by"><p>Edited by: Zisis Kozlakidis, International Agency For Research On Cancer (IARC), France</p></fn>
<fn fn-type="edited-by"><p>Reviewed by: Dawei Cui, Zhejiang University School of Medicine, China; Io Cheong, Shanghai Jiao Tong University, China</p></fn>
<corresp id="c001">&#x0002A;Correspondence: Chayaporn Suphavilai <email>suphavilaic&#x00040;gis.a-star.edu.sg</email></corresp>
<fn fn-type="other" id="fn001"><p>This article was submitted to Infectious Diseases - Surveillance, Prevention and Treatment, a section of the journal Frontiers in Medicine</p></fn>
<fn fn-type="equal" id="fn002"><p>&#x02020;These authors have contributed equally to this work</p></fn></author-notes>
<pub-date pub-type="epub">
<day>14</day>
<month>12</month>
<year>2021</year>
</pub-date>
<pub-date pub-type="collection">
<year>2021</year>
</pub-date>
<volume>8</volume>
<elocation-id>790662</elocation-id>
<history>
<date date-type="received">
<day>07</day>
<month>10</month>
<year>2021</year>
</date>
<date date-type="accepted">
<day>23</day>
<month>11</month>
<year>2021</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x000A9; 2021 Yingtaweesittikul, Ko, Abdul Rahman, Tan, Nagarajan and Suphavilai.</copyright-statement>
<copyright-year>2021</copyright-year>
<copyright-holder>Yingtaweesittikul, Ko, Abdul Rahman, Tan, Nagarajan and Suphavilai</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license> 
</permissions>
<abstract><p><bold>Background:</bold> The ongoing COVID-19 pandemic is a global health crisis caused by the spread of SARS-CoV-2. Establishing links between known cases is crucial for the containment of COVID-19. In the healthcare setting, the ability to rapidly identify potential healthcare-associated COVID-19 clusters is critical for healthcare worker and patient safety. Increasing sequencing technology accessibility has allowed routine clinical diagnostic laboratories to sequence SARS-CoV-2 in clinical samples. However, these laboratories often lack specialized informatics skills required for sequence analysis. Therefore, an on-site, intuitive sequence analysis tool that enables clinical laboratory users to analyze multiple genomes and derive clinically relevant information within an actionable timeframe is needed.</p>
<p><bold>Results:</bold> We propose CalmBelt, an integrated framework for on-site whole genome characterization and outbreak tracking. Nanopore sequencing technology enables on-site sequencing and construction of draft genomes for multiple SARS-CoV-2 samples within 12 h. CalmBelt&#x00027;s interactive interface allows users to analyse multiple SARS-CoV-2 genomes by utilizing whole genome information, collection date, and additional information such as predefined potential clusters from epidemiological investigations. CalmBelt also integrates established SARS-CoV-2 nomenclature assignments, GISAID clades and PANGO lineages, allowing users to visualize relatedness between samples together with the nomenclatures. We demonstrated multiple use cases including investigation of potential hospital transmission, mining transmission patterns in a large outbreak, and monitoring possible diagnostic-escape.</p>
<p><bold>Conclusions:</bold> This paper presents an on-site rapid framework for SARS-CoV-2 whole genome characterization. CalmBelt interactive web application allows non-technical users, such as routine clinical laboratory users in hospitals to determine SARS-CoV-2 variants of concern, as well as investigate the presence of potential transmission clusters. The framework is designed to be compatible with routine usage in clinical laboratories as it only requires readily available sample data, and generates information that impacts immediate infection control mitigations.</p></abstract>
<kwd-group>
<kwd>SARS-CoV-2</kwd>
<kwd>whole genome sequencing</kwd>
<kwd>outbreak tracking</kwd>
<kwd>nanopore sequencing</kwd>
<kwd>web application</kwd>
</kwd-group>
<counts>
<fig-count count="5"/>
<table-count count="0"/>
<equation-count count="1"/>
<ref-count count="41"/>
<page-count count="11"/>
<word-count count="6443"/>
</counts>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="s1">
<title>Introduction</title>
<p>The ongoing coronavirus disease (COVID-19) pandemic, caused by the betacoronavirus SARS-CoV-2, is a rapidly evolving global health crisis. As of 13th September 2021, more than 224 million cases of COVID-19 resulting in more than 4.6 million deaths have occurred worldwide (<xref ref-type="bibr" rid="B1">1</xref>, <xref ref-type="bibr" rid="B2">2</xref>). In Singapore, 71,687 COVID-19 cases have been identified since the beginning of the pandemic (<xref ref-type="bibr" rid="B3">3</xref>). The aggressive contact tracing and quarantine efforts had helped to reduce the spread of SARS-CoV-2 in Singapore (<xref ref-type="bibr" rid="B4">4</xref>).</p>
<p>The sequencing of SARS-CoV-2 from clinical samples is crucial for the understanding and control of SARS-CoV-2. Genomic surveillance of SARS-CoV-2 enables the detection and close monitoring of emergent variants which may be associated with increased transmissibility or disease severity, or which may impair the effectiveness of current vaccines, diagnostic methods, therapeutics, and public health control strategies. Emerging SARS-CoV-2 variants are closely monitored by WHO (<xref ref-type="bibr" rid="B5">5</xref>) and various health authorities (<xref ref-type="bibr" rid="B6">6</xref>, <xref ref-type="bibr" rid="B7">7</xref>), emphasizing the importance of genomic surveillance. Additionally, whole-genome comparative analysis of SARS-CoV-2 from clinical samples provides valuable transmission information to guide clustering of linked COVID-19 cases (<xref ref-type="bibr" rid="B8">8</xref>). This is particularly useful where epidemiological data alone is insufficient to link cases due to human and circumstantial factors. Clustering of linked cases facilitates the use of contact tracing and quarantine measures to limit the spread of SARS-CoV-2.</p>
<p>Since the first SARS-CoV-2 whole-genome sequences were made available on the sequence repository GISAID (<xref ref-type="bibr" rid="B9">9</xref>) in January 2020, over 3.4 million SARS-CoV-2 sequences have been shared from around the world. The availability of low cost handheld sequencers, such as Oxford Nanopore Technologies (ONT) (<xref ref-type="bibr" rid="B10">10</xref>), has significantly lowered entry and sequencing costs, allowing many laboratories to sequence SARS-CoV-2 from clinical samples. These laboratories can share and analyse the SARS-CoV-2 whole-genome sequences at the regional and population level via GISAID (<xref ref-type="bibr" rid="B9">9</xref>) and genomic analytic platforms such as Nextstrain (<xref ref-type="bibr" rid="B8">8</xref>), allowing large-scale pathogen evolution tracking.</p>
<p>However, barriers remain in place that limit the ability of these sentinel laboratories to obtain meaningful analysis of small sets of locally sequenced SARS-CoV-2 genomes for the purposes of local outbreak investigations. One key barrier is that diagnostic laboratories often lack specialized informatics skills for the analysis of whole-genome sequence data. This results in delays to analysis of the data thus obtained.</p>
<p>Another barrier in place is that the PANGO lineage nomenclature (<xref ref-type="bibr" rid="B11">11</xref>) currently used for the classification of SARS-CoV-2 outbreaks does not provide the resolution required for local outbreak investigations. The PANGO lineage assigned to a SARS-CoV-2 whole-genome sequence is based on a large phylogenetic tree of SARS-CoV-2 genomes. As it is not practical to rebuild the large phylogenetic tree whenever new genomes become available, the new genomes are classified into different subtrees (lineages) according to the prediction from a machine learning model, which has been regularly trained to predict lineage using whole genome information. However, the performance of the machine learning model (decision tree) is not perfect, with a macro-average precision of 91.66% and a recall of 91.51% across 778 pre-defined PANGO lineages (<xref ref-type="bibr" rid="B11">11</xref>, <xref ref-type="bibr" rid="B12">12</xref>). Additionally, some pre-defined sets of mutations (decision tree rules) for classifying PANGO lineages are limited. For instance, only 79 genomic loci [with 12 mutations (<xref ref-type="bibr" rid="B13">13</xref>)] were chosen by the decision tree for classifying lineage B.1.617.2 (<xref ref-type="bibr" rid="B14">14</xref>).</p>
<p>To address these barriers, we propose CalmBelt, an integrated framework for on-site whole-genome characterization and outbreak tracking. Compared to existing analytic frameworks such as GISAID and Nextstrain (<xref ref-type="bibr" rid="B8">8</xref>, <xref ref-type="bibr" rid="B9">9</xref>), CalmBelt addresses the issue of resolution required for local outbreak investigations by using data driven analysis based on whole-genome sequence and sample collection information as an alternative strategy to the pre-defined phylogenetic tree and machine learning model of the PANGO lineage. Furthermore, unlike available command-line bioinformatics tools (<xref ref-type="bibr" rid="B11">11</xref>, <xref ref-type="bibr" rid="B15">15</xref>&#x02013;<xref ref-type="bibr" rid="B17">17</xref>), CalmBelt provides an easy-to-use platform for sentinel clinical diagnostic laboratories to analyse whole-genome sequences on-site, as soon as they become available. The intuitive design of CalmBelt allows users to integrate sample collection date and pre-defined epidemiological data together with whole-genome sequence data. With just a few clicks, CalmBelt can provide a customized visualization of genome relatedness together with the established SARS-CoV-2 nomenclature of GISAID clades and PANGO lineages for each whole-genome sequence. Therefore, CalmBelt allows users to preliminarily and rapidly interrogate the locally generated set of whole-genome sequence data, negating the biohazard risks and delay associated with SARS-CoV-2 sample transfer, or delay associated with submission to a curated database such as GISAID (<xref ref-type="bibr" rid="B9">9</xref>).</p>
<p>We demonstrate the deployment of CalmBelt in a hospital diagnostic laboratory, where ONT minION (<xref ref-type="bibr" rid="B10">10</xref>) was used to generate SARS-CoV-2 whole-genome sequences from clinical samples on-site. CalmBelt enabled actionable information to be generated within 12 h following the detection of SARS-CoV-2 in a clinical sample. This ability to rapidly sequence and analyse SARS-CoV-2 whole-genome data enabled the swift implementation of local infection control measures, which are particularly important in suspected healthcare-associated transmission clusters.</p>
</sec>
<sec sec-type="materials and methods" id="s2">
<title>Materials and Methods</title>
<sec>
<title>On-Site SARS-CoV-2 Genome Sequencing</title>
<p>Nasopharyngeal swab samples were routinely tested using the Cepheid Xpert Xpress SARS-CoV-2 assay or the Roche cobas SARS-CoV-2 test. The routine diagnostic tests were performed in a CAP-accredited laboratory in a tertiary hospital, in biosafety level 2 plus containment. In brief, laboratory personnel in full PPE (<xref ref-type="bibr" rid="B18">18</xref>) performed all sample processing and chemical inactivation within a biosafety cabinet. All nasopharyngeal swabs were chemically inactivated (<xref ref-type="bibr" rid="B19">19</xref>, <xref ref-type="bibr" rid="B20">20</xref>) for 30 min prior to transfer to the GeneXpert Infinity (Cepheid) in biosafety level 2 containment, or cobas 6800 System (Roche) in biosafety level 2 plus containment, for the SARS-CoV-2 tests. Remnant clinical samples found to be positive for SARS-CoV-2 RNA, with a Ct value of &#x0003C;31 were subjected to an additional round of chemical inactivation (<xref ref-type="bibr" rid="B19">19</xref>, <xref ref-type="bibr" rid="B20">20</xref>) within the biosafety cabinet within biosafety level 2 plus containment, in the same laboratory. Total nucleic acid extraction of the chemically inactivated remnant samples were performed using the NucliSENS easyMag (bioMerieux) platform. The resultant total nucleic acid extract was used for downstream RT-PCR, and sequencing on ONT MinION in accordance with the ARTIC protocol v3 (<xref ref-type="bibr" rid="B21">21</xref>), within the same laboratory, in biosafety level 2 containment. A maximum of 25 clinical samples was sequenced on an ONT MinION sequencer in a single run. The laboratory has the capability to obtain SARS-CoV-2 sequence data from 50 clinical samples with two available ONT MinION setups. RAMPART protocol (<xref ref-type="bibr" rid="B22">22</xref>) was used to monitor the depth of coverage for each sample and to construct a draft genome. A previously sequenced clinical sample and a negative control (no template control) were included as positive and negative controls in every run.</p>
</sec>
<sec>
<title>SARS-CoV-2 Genome Data</title>
<p>SARS-CoV-2 genomes collected in Singapore were obtained from GISAID (3,406 genomes as of 30 June 2021; <xref ref-type="supplementary-material" rid="SM1">Supplementary File 1</xref>). Genomes data collected from non-human hosts and environment were discarded. Missing collection dates were imputed with the first date of the respective month. Clade and lineage information were also downloaded from GISAID, where the clade the trends were calculated based on rolling average (7 days). Specific information of 99 de-identified positive cases used in the case studies was collected in Singapore General Hospital between January to August 2020 (<xref ref-type="supplementary-material" rid="SM2">Supplementary File 2</xref>).</p>
</sec>
<sec>
<title>Identifying Mutation</title>
<p>Each SARS-CoV-2 genome obtained from on-site sequencing or GISAID was aligned to the standard SARS-CoV-2 reference genome (NC_045512.2) (<xref ref-type="bibr" rid="B23">23</xref>), using blastn. The alignment output in XML format was used for identifying single nucleotide polymorphisms (SNPs), insertion and deletion (Indels) with respect to the nucleotide position of the reference genome. For the genomes with multiple alignment blocks, the priority for identifying SNPs and Indels in the overlapping region was given to the longer alignment block.</p>
</sec>
<sec>
<title>Visualization of Overall Trends</title>
<p>To visualize the overall trends within a country, we employ two different types; a 2D scatter plot via tSNE (<xref ref-type="bibr" rid="B24">24</xref>) and an interactive dendrogram. We begin by calculating nucleotide diversity at each position using</p>
<disp-formula id="E1"><mml:math id="M1"><mml:mtable columnalign="left"><mml:mtr><mml:mtd><mml:mi>D</mml:mi><mml:mi>i</mml:mi><mml:mi>v</mml:mi><mml:mi>e</mml:mi><mml:mi>r</mml:mi><mml:mi>s</mml:mi><mml:mi>i</mml:mi><mml:mi>t</mml:mi><mml:mi>y</mml:mi><mml:mtext>&#x000A0;</mml:mtext><mml:mo>=</mml:mo><mml:mo>-</mml:mo><mml:mstyle displaystyle="true"><mml:munder class="msub"><mml:mrow><mml:mo>&#x02211;</mml:mo></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mo>&#x02208;</mml:mo><mml:mrow><mml:mo>{</mml:mo><mml:mrow><mml:mi>A</mml:mi><mml:mo>,</mml:mo><mml:mi>T</mml:mi><mml:mo>,</mml:mo><mml:mi>C</mml:mi><mml:mo>,</mml:mo><mml:mi>G</mml:mi></mml:mrow><mml:mo>}</mml:mo></mml:mrow></mml:mrow></mml:munder></mml:mstyle><mml:msub><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mi>l</mml:mi><mml:mi>o</mml:mi><mml:mi>g</mml:mi><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:msub><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>
<p>where <italic>x</italic><sub><italic>i</italic></sub> is a frequency of each nucleotide and <inline-formula><mml:math id="M2"><mml:munder class="msub"><mml:mrow><mml:mo>&#x02211;</mml:mo></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mo>&#x02208;</mml:mo><mml:mrow><mml:mo>{</mml:mo><mml:mrow><mml:mi>A</mml:mi><mml:mo>,</mml:mo><mml:mi>T</mml:mi><mml:mo>,</mml:mo><mml:mi>C</mml:mi><mml:mo>,</mml:mo><mml:mi>G</mml:mi></mml:mrow><mml:mo>}</mml:mo></mml:mrow></mml:mrow></mml:munder><mml:msub><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mtext>&#x000A0;</mml:mtext><mml:mn>1</mml:mn></mml:math></inline-formula>.</p>
<p>We then choose top 50 positions with highest diversity and positions that are predefined in GISAID (<xref ref-type="bibr" rid="B25">25</xref>). The high diversity positions were then used for calculating hamming distance among all 3,406 genomes for tSNE and dendrogram plots. For tSNE plot, we also applied k-means clustering, where k was set to 8, which is equal to the number lineages predefined by WHO.</p>
</sec>
<sec>
<title>Outbreak Tracking Using Whole-Genome Information</title>
<p>For outbreak tracking, users can input multiple SARS-CoV-2 genomes (the maximum number of input genomes &#x02264;200) obtained from the on-site sequencing platform. The input file should be in fasta format, where each input file contains one genome. The file name must follow <italic>SampleID_dd-mm-yyyy_GroupName.fasta</italic>, which consists of sampling identifier, collection date and predefined group name such as a location.</p>
<p>Each input genome is aligned to the SARS-CoV-2 reference genome using blastn, and GISAID clade is reported (<xref ref-type="bibr" rid="B25">25</xref>) (<xref ref-type="supplementary-material" rid="SM3">Supplementary File 3</xref>). A standard lineage identification model (version 3.1.15) was installed for predicting PANGO lineage of each input genome (<xref ref-type="bibr" rid="B11">11</xref>), in line with the nomenclature used worldwide. CalmBelt also alerts users when the breadth of coverage is &#x0003C;95%, allowing users to carefully analyse low-quality genome data.</p>
<p>To construct a phylogenetic tree of the input genomes, we followed the steps used for determining PANGO lineage by using these specific options &#x0201C;<italic>mafft &#x02013;retree 2 concat.fasta</italic> &#x0003E; <italic>concat.mafft&#x0201D;</italic> and &#x0201C;<italic>iqtree2 -s concat.mafft -m GTR</italic>&#x0002B;<italic>G&#x0201D;</italic> (<xref ref-type="bibr" rid="B11">11</xref>). Similar to Nextstrain, we applied TreeTime (<xref ref-type="bibr" rid="B26">26</xref>) to generate time stamped phylogenies (Nextstrain&#x00027;s transmission tree) of the input genomes. To generate a similarity tree of the input genomes, whole-genome alignment information from blastn was used for calculating normalized hamming distance, and UPGMA clustering was applied on the distance matrix. In addition, as the hierarchical clustering process could introduce ambiguity for a large number of closely related genomes, a heatmap of distance matrix was also displayed to provide a quantitative measure of relatedness (i.e., number of different nucleotide positions).</p>
<p>An interactive similarity tree is drawn based on the whole-genome distance matrix alongside the collection date. Each node is colored according to the group name. Within the interactive tree, CalmBelt reports a subset of mutations and amino acid changes (with respect to blastn result). In the case that there are &#x0003C;3 nucleotides (i.e., frameshift mutations) to translate for an amino acid, the amino acid is marked as &#x0201C;X.&#x0201D; A full list of mutations is reported in a downloadable table. Monthly statistics of each PANGO lineage or sublineage in each country is also provided.</p>
</sec>
<sec>
<title>Inspecting Changes Within the Genomic Region of Interest</title>
<p>We implemented a portal where users can inspect specific genomic regions and mutations of interest of the genomes (3,406 genomes from GISAID) that have been processed in the previous step. Once users input the region of interest, SNPs and Indels are reported in multiple interactive charts. The charts display both nucleotide and amino acid changes that occurred in each month. To inspect concurrent mutations or variants of concerns, the portal reports the number of occurrences based on a list of mutations from users. These features are useful for detecting diagnostic-escape by inspecting primer binding sites and inspecting concurrent mutations.</p>
</sec>
<sec>
<title>Software and Packages</title>
<p>For implementing CalmBelt and analyses, we used multiple Python packages including pandas 1.1.3, matplotlib 3.3.2, numpy 1.19.2, scipy 1.5.2, seaborn 0.11.0, plotly 4.14.3, ray 1.1.0, sklearn 0.23.2, biopython 1.78, dash 1.19.0. Additional software packages include Blastn 2.6 (<xref ref-type="bibr" rid="B15">15</xref>), Pango 3.1.7 (<xref ref-type="bibr" rid="B11">11</xref>), Mafft (&#x02013;retree 2) (<xref ref-type="bibr" rid="B16">16</xref>), IQTREE-2 (-m GTR&#x0002B;G) (<xref ref-type="bibr" rid="B17">17</xref>), and TreeTime (<xref ref-type="bibr" rid="B26">26</xref>). CalmBelt&#x00027;s source code and an installation guideline are available at <ext-link ext-link-type="uri" xlink:href="https://github.com/BioML-CM/CalmBelt">https://github.com/BioML-CM/CalmBelt</ext-link>. The demo version and example data is available at <ext-link ext-link-type="uri" xlink:href="https://calmbelt-demo.mtms.dev">https://calmbelt-demo.mtms.dev</ext-link>.</p>
</sec>
</sec>
<sec sec-type="results" id="s3">
<title>Results</title>
<sec>
<title>Whole Genome Characterization and Clustering for Outbreak Investigation</title>
<p>Nasopharyngeal swab samples were routinely tested using the Cepheid Xpert Xpress SARS-CoV-2 assay or the Roche cobas SARS-CoV-2 test. Samples found to be positive for SARS-CoV-2 RNA, with a Ct value of &#x0003C;31 were subjected to total nucleic acid extraction using the NucliSENS easyMag (bioMerieux) platform. The total nucleic acid extract was used for downstream RT-PCR, and sequencing on ONT MinION in accordance with the ARTIC protocol v3 (<xref ref-type="bibr" rid="B21">21</xref>). RAMPART protocol (<xref ref-type="bibr" rid="B22">22</xref>) was used to monitor the depth of coverage for each sample and to construct a draft genome (<bold>Methods</bold>; <xref ref-type="fig" rid="F1">Figure 1A</xref>).</p>
<fig id="F1" position="float">
<label>Figure 1</label>
<caption><p>CalmBelt overview. <bold>(A)</bold> On-site sequencing protocol based on the Nanopore sequencing platform and ARCTIC protocol for sequencing and generating draft genomes. <bold>(B)</bold> Rapid analysis pipeline. Multiple SARS-CoV-2 genomes are aligned to the reference genome. A distance matrix calculated based on whole-genome alignment is used for hierarchical clustering. CalmBelt automatically generates an interactive tree capturing whole genome similarity, collection date (x-axis) and case information (color).</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmed-08-790662-g0001.tif"/>
</fig>
<p>Once the draft genome became available, Users dragged and dropped the SARS-CoV-2 genome files into the analysis interface (<xref ref-type="fig" rid="F1">Figure 1B</xref>). Multiple genomes from on-site sequencing were aligned to the reference genome. ClamBelt then identified mutations, calculated whole genome similarity, and constructed multiple trees for transmission tracking (<bold>Methods</bold>). As the number of mutations per genome continued to increase (&#x0007E;2&#x02013;3 mutations per month; <xref ref-type="supplementary-material" rid="SM4">Supplementary Figure 1</xref>), CalmBelt only visualized a subset of mutations while providing the downloadable full list of mutations.</p>
<p>The similarity tree captures hierarchical clustering results based on the whole genome similarity. The x-axis represents collection date, and colors represent case-specific information such as locations, as defined by the users. CalmBelt integrates existing nomenclatures including GISAID clade (<xref ref-type="bibr" rid="B9">9</xref>, <xref ref-type="bibr" rid="B25">25</xref>) and PANGO lineages (<xref ref-type="bibr" rid="B12">12</xref>, <xref ref-type="bibr" rid="B27">27</xref>). For each case, comprehensive information including mutations at nucleotide- and amino acid-level can be displayed interactively.</p>
<p>As highlighted in the Nextstrain web portal (<xref ref-type="bibr" rid="B28">28</xref>), &#x0201C;copying mistakes&#x0201D; that accumulate in the genome could facilitate tracking of transmission routes and dynamics, while a phylogenetic tree could infer locations of each case. CalmBelt therefore visualizes multiple types of trees, as well as a distance matrix capturing pairwise distance between SARS-CoV-2 genomes, to provide multiple perspectives for epidemiology units (<xref ref-type="fig" rid="F1">Figure 1B</xref>; <xref ref-type="supplementary-material" rid="SM5">Supplementary Figure 2</xref>).</p>
<p>Besides, CalmBelt analyzed overall statistics for a large set of 3,406 genomes from Singapore (<xref ref-type="fig" rid="F2">Figure 2</xref>, Methods). Users can inspect the statistics based on genomic information in terms of GISAID clade, which captures the trends at the beginning of the pandemic, and the newly defined PANGO lineage name according to WHO (<xref ref-type="fig" rid="F2">Figure 2A</xref>). For example, we observed a clear dominant clade from April 2020 to September 2020, corresponding to the foreign worker dormitory outbreak in Singapore (<xref ref-type="bibr" rid="B29">29</xref>). Apart from the period of dormitory outbreak, the trends we observed in the Singapore data are more similar to the trend observed across countries in Asia compared to the trends observed in other continents, in line with geographical information (<xref ref-type="supplementary-material" rid="SM6">Supplementary Figures 3</xref>, <xref ref-type="supplementary-material" rid="SM7">4</xref>).</p>
<fig id="F2" position="float">
<label>Figure 2</label>
<caption><p>Statistics of SARS-CoV-2 genomes in Singapore (January 2020&#x02013;June 2021). <bold>(A)</bold> A time series presenting proportion of different clades based on GISAID criteria and the newly defined lineage name according to WHO. <bold>(B)</bold> Nucleotide diversity across SARS-CoV-2 genomic loci <bold>(C,D)</bold> T-SNE plots visualize clusters of SAR-CoV2 genomes, where the distances are based on high diversity loci <bold>(E,F)</bold> Dendrograms present different SAR-CoV2 genome along with collection date and lineage information.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmed-08-790662-g0002.tif"/>
</fig>
<p>Similar to Nextstrain (<xref ref-type="bibr" rid="B8">8</xref>), nucleotide diversity was calculated for each genome position. We observed various mutation rates across different genes (<xref ref-type="fig" rid="F2">Figure 2B</xref>). While mutations in the S gene, which encodes the Spike protein (<xref ref-type="bibr" rid="B30">30</xref>) is of particular interest due to its role in infectivity and vaccine efficacy, other genes (e.g., E gene, N gene) are monitored as they are commonly used as diagnostic targets (<xref ref-type="bibr" rid="B31">31</xref>). We note that CalmBelt shows information from all genomes without subsampling, a pre-processing step used in Nextstrain.</p>
<p>Genomic loci with high diversity were used for visualization (<xref ref-type="fig" rid="F2">Figures 2C&#x02013;F</xref>). Overlaying PANGO lineage information onto the 2D visualization, we observed multiple clusters that have the same lineage name (<xref ref-type="fig" rid="F2">Figures 2C,E</xref>). We found that clustering based on high diversity genomic loci could capture the foreign worker dormitory outbreak (C2; <xref ref-type="fig" rid="F2">Figures 2D,F</xref>) and distinguished Delta (B.1.617.2) into three different clusters (C0, C3, C5) that spreaded at distinct time periods, suggesting different sources of the outbreak even though all cases were annotated as Delta based on the newly assigned PANGO lineage.</p>
</sec>
<sec>
<title>Investigating Healthcare-Associated SARS-CoV-2 Transmission</title>
<p>Four healthcare workers working in the same institution were found to be positive for SARS-CoV-2 within a short span of time. There were concerns of healthcare-associated/occupationally acquired SARS-CoV-2 infections among the healthcare workers. Therefore, on-site sequencing was performed for 4 healthcare workers&#x00027; samples, along with 6 samples from the community and 2 samples from dormitory residents. A similar pattern was observed across different types of trees (<xref ref-type="fig" rid="F3">Figures 3A,B</xref>, Methods). The similarity and transmission trees had the added advantage of capturing temporal relationships based on collection date information, which are useful adjuncts in outbreak investigations. Based on CalmBeIt&#x00027;s outputs, it was concluded that sequences from the four de-identified healthcare workers belonged to different clusters, suggesting that SARS-CoV-2 transmission did not occur in the healthcare or occupational setting in this instance.</p>
<fig id="F3" position="float">
<label>Figure 3</label>
<caption><p>Relationship of 12 SARS-CoV-2 genomes observed in the community (C), healthcare workers (H), and dormitory residents (D). <bold>(A)</bold> A similarity tree is based on a combination of whole genome similarity and collection date. <bold>(B)</bold> A phylogenetic tree based on multiple sequence alignment and a predefined mutation rate model (Mafft and IQ-TREE2), where <sup>&#x0002A;&#x0002A;</sup> indicate zero distance.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmed-08-790662-g0003.tif"/>
</fig>
<p>To enhance the ability to identify potential sources of epidemiologically unlinked cases, CalmBelt allows users to query for statistics of a given PANGO lineage in different countries for a specific month. For example, in March 2020, B.6.6 was widespread in Cambodia (2/19, 10.53%), Singapore (36/381, 9.45%) and Malaysia (5/56, 8.93%) (<xref ref-type="supplementary-material" rid="SM8">Supplementary Figure 5</xref>). This information will allow users to identify potential links for further epidemiological investigations.</p>
</sec>
<sec>
<title>Mining Transmission Patterns in a Large Outbreak</title>
<p>We inspected 89 randomly selected, de-identified positive cases from the foreign worker dormitory outbreak in Singapore between April to August 2020. Using CalmBelt&#x00027;s interactive tree, we observed two main clusters (<xref ref-type="fig" rid="F4">Figure 4</xref>). In the first cluster (orange color; left), the majority of the cases were from a single dormitory (D8), two cases were from D10 and one case was from D9. However, there are 5 cases from D8 in the second cluster, suggesting that there were at least two sources of the infection in D8. In the second cluster (mixed colors; right), cases from many dormitories were observed. Cases from the same dormitory tend to form a cluster, highlighting the spread of the SARS-CoV-2 virus within each dormitory. In addition, we observed multiple small clusters in some dormitories (e.g., within D2, S53 &#x0002B; S74 &#x0002B; S128, S136 &#x0002B; S137, S129 &#x0002B; S130 &#x0002B; S77, S157 &#x0002B; S132), which may suggest multiple sources and routes of transmission within D2.</p>
<fig id="F4" position="float">
<label>Figure 4</label>
<caption><p>A genome similarity tree shows the relationship among 89 randomly selected, de-identified positive cases which were labeled to be from dormitory residents. These positive cases were detected from 12 dormitories (D1&#x02013;D12) from the foreign worker dormitory outbreak in Singapore (April&#x02013;August 2020). Each data point represents a positive case, and colors represent different, de-identified dormitories.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmed-08-790662-g0004.tif"/>
</fig>
<p>While PANGO lineages are meant to delineate outbreaks, in the setting of a rapidly disseminating local outbreaks, the resolution offered by PANGO lineage assignment alone is likely to be insufficient. For example, in the case of this large-scale dormitory outbreak, the majority of the cases (73%) were annotated as B.6.6. CalmBelt was able to capture whole genome similarity and increased the resolution, thereby delineating possible clusters within each dormitory.</p>
</sec>
<sec>
<title>Monitoring Possible Diagnostic-Escape</title>
<p>CalmBelt can be used to monitor genomic mutations and allow users to investigate genomic regions of interest. As a use case, we selected three genomic regions in the N gene, based on PCR primers used for the detection of N gene [US-CDC-N1 to N3 (<xref ref-type="bibr" rid="B32">32</xref>); <xref ref-type="fig" rid="F5">Figure 5A</xref>]. We found that mutations occurred in &#x0003C;5% of Singapore sequences (18 out of 598 and 6 out of 401) in the regions primed by US-CDC-N1 and US-CDC-N3. However, for the region primed by US-CDC-N2, we observed a higher percentage (19%) of Singapore sequences that harbor a mutation at position 29,179. This tool therefore allows users to monitor for emerging diagnostic escapes, based on the local laboratories&#x00027; primer sequences and relevant regional SARS-CoV-2 sequence data.</p>
<fig id="F5" position="float">
<label>Figure 5</label>
<caption><p>Inspecting mutations in a specific region for each month. <bold>(A)</bold> Mutation frequencies of three genomic regions in the N gene (PCR primers US-CDC-N1 to N3). <bold>(B&#x02013;D)</bold> CalmBelt reports the number of cases for each amino acid change (missense mutation) according to user input. <bold>(D)</bold> Number of cases harboring co-occurrence amino acid changes (L452R and P681R in S gene).</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmed-08-790662-g0005.tif"/>
</fig>
<p>As the number of mutations per genome continued to accumulate, &#x0007E;2&#x02013;3 new mutations emerged per month (<xref ref-type="supplementary-material" rid="SM4">Supplementary Figure 1</xref>). CalmBelt allows users to input a custom list of mutations and reports the number of cases where each mutation is present. For example, we added a list of mutations occurring in B.1.617.2 lineage or Delta (<xref ref-type="bibr" rid="B13">13</xref>) including variants of biological significance S:P681R and S:L452R which are associate with viral infectivity and reduction in antibody neutralization in the presence of other mutations in S gene (<xref ref-type="bibr" rid="B33">33</xref>, <xref ref-type="bibr" rid="B34">34</xref>) (<xref ref-type="fig" rid="F5">Figure 5B</xref>). Alternatively, users can input a protein name and a range of amino acid loci (<xref ref-type="fig" rid="F5">Figure 5C</xref>). CalmBelt also allows users to input a specific set of mutations to observe the co-occurring frequency in each month (<xref ref-type="fig" rid="F5">Figure 5D</xref>). In our example, we found that the co-occurrence of two variants (S:P681R and S:L452R) is well-preserved, which suggests biological significance that warrants further investigations (<xref ref-type="bibr" rid="B35">35</xref>).</p>
</sec>
</sec>
<sec sec-type="discussion" id="s4">
<title>Discussion</title>
<p>We present CalmBelt, a streamlined framework for on-site sequencing and analysis of SARS-CoV-2 genomes for outbreak tracking (<xref ref-type="fig" rid="F1">Figures 1</xref>, <xref ref-type="fig" rid="F2">2</xref>). Using the nanopore sequencing platform, we initiated sequencing on-site within the hospital diagnostic laboratory once clinical samples were found to be positive by routine RT-PCR testing. While nanopore technologies have significantly improved accessibility to sequencing capability, the ability to analyze sequence data within an actionable time frame remains a challenge for many hospital laboratories. CalmBelt was developed to close this gap by allowing typical diagnostic laboratory users with no formal bioinformatic training to analyze whole genome sequence data to facilitate outbreak investigations and control in the healthcare settings.</p>
<p>When CalmBelt was fully incorporated into the diagnostic laboratory&#x00027;s workflow, &#x0003C;24 h was required from nasopharyngeal swab sample receipt to CalmBelt outputs. This was achieved by the use of a routine RT-PCR diagnostic test with rapid turnaround time (Cepheid Xpert Xpress SARS-CoV-2 assay), as well as a workflow that initiated downstream processing for nanopore sequencing as soon as the sample was found to be positive for SARS-CoV-2. Calmbelt could generate an online report capturing relatedness of the samples analyzed, within 24 h of sample arrival in the laboratory, which is a timeframe compatible with infection control mitigations in the healthcare setting (<xref ref-type="fig" rid="F3">Figures 3</xref>, <xref ref-type="fig" rid="F4">4</xref>).</p>
<p>The repeated, rapid emergence of SARS-CoV-2 variants necessitates constant vigilance against variants that may escape routine diagnostic detection by commonly used RT-PCR assays (<xref ref-type="bibr" rid="B31">31</xref>, <xref ref-type="bibr" rid="B36">36</xref>). To that end, CalmBelt was designed to help users monitor for mutations in primer-binding sites, which is an important safeguard against plausible diagnostic-escapes (<xref ref-type="fig" rid="F5">Figure 5</xref>). The curated genomes in the GISAID SARS-CoV-2 database provides a great resource for us to gather mutation information within a specific country and across the globe, allowing us to track mutation patterns in certain genomic regions to monitor plausible diagnostic-escape (<xref ref-type="bibr" rid="B31">31</xref>). Even when proprietary primer sequences are used in commercial RT-PCR assays, CalmBelt allows mutations in the targeted gene(s) to be monitored by the users, and questions can be raised to assay manufacturers if any unusual trends are observed.</p>
<p>A major criticism of the nanopore platform has been the suboptimal sequencing accuracy. Using the improved ARCTIC protocol (<xref ref-type="bibr" rid="B21">21</xref>), we were able to obtain high accuracy genomes from most of the samples. Various recent studies similarly reported the successful use of nanopore platforms to obtain SARS-CoV-2 whole-genome sequences (<xref ref-type="bibr" rid="B10">10</xref>, <xref ref-type="bibr" rid="B37">37</xref>, <xref ref-type="bibr" rid="B38">38</xref>), and thousands of SARS-CoV-2 genomes submitted to GISAID were derived solely from nanopore sequencing. This demonstrates that the nanopore platform is able to generate adequately accurate SARS-CoV-2 sequence data for real-time downstream analyses. Given the small footprint, relatively low setup cost, nanopore will continue to play an important role in democratizing access to sequencing.</p>
<p>The B.1.617.2 (Delta) variant has rapidly become the dominant variant in Singapore by mid 2021. To delineate outbreak clusters among cases infected with B.1.617.2, CalmBelt was designed to achieve a higher resolution than the widely used PANGO lineage. Besides the suboptimal performance of the machine learning model for PANGO lineage prediction, as the number of accumulated mutations in SARS-CoV-2 genomes is growing (<xref ref-type="bibr" rid="B39">39</xref>, <xref ref-type="bibr" rid="B40">40</xref>), a single large phylogenetic tree could lose the resolution of retrospective cases (<xref ref-type="fig" rid="F4">Figure 4</xref>) as well as recent cases, where most cases are identified as Delta despite coming from different community clusters (<xref ref-type="bibr" rid="B8">8</xref>).</p>
<p>Several web applications for SARS-CoV-2 sequence analyses, such as Nextstrain (<xref ref-type="bibr" rid="B9">9</xref>), Audacity, PrimerChecker (<xref ref-type="bibr" rid="B9">9</xref>) and CoVariants (<xref ref-type="bibr" rid="B41">41</xref>), have been recently developed. However, none of these tools (except Nextstrain) focus on integrating custom user input and sample collection dates to create a specialized report for outbreak investigations and control mitigations in the healthcare settings. With the availability of nanopore sequencing technologies, sentinel clinical diagnostic laboratories performing routine SARS-CoV-2 RT-PCR testing are in the position to generate SARS-CoV-2 sequence data most rapidly and seamlessly from clinical samples and contribute to rapid local outbreak response. By integrating rapid diagnostic testing, on-site nanopore sequencing and intuitive genome analysis afforded by CalmBelt, we were able to generate outbreak reports from clinical samples within a day. In the event of sensitive clusters, such as hospitals, senior care homes and schools, the quick availability of such reports will complement manual contact tracing and contribute to faster and better control of spread among vulnerable or unvaccinated populations.</p>
<p>Although the use of the nanopore platform and easy-to-use informatic tools such as CalmBelt have made SARS-CoV-2 sequencing and analysis increasingly accessible, hurdles remain for large scale implementation. The consumable and manpower cost continue to be a challenge in resource-limited settings, as clinical diagnostic laboratories are generally designed and budgeted based on large-volume routine testing. While the COVID-19 pandemic might have accelerated the capital investment and development of molecular diagnostics in routine clinical laboratories, manpower well-versed in the sequence data interpretation and application may constrain implementation. Therefore, further development and human capital and sequencing laboratory setups are necessary to encourage large scale implementation of SARS-CoV-2 sequencing.</p>
<p>While the data presented in this paper is tailored to SARS-CoV-2 genome analysis, our bioinformatic workflow can be easily adapted for other viruses where the sequencing workflow can follow ARTIC network protocols (<xref ref-type="bibr" rid="B21">21</xref>). This versatility allows users deploying CalmBelt to build preparedness and resilience for outbreaks and pandemics beyond the current COVID-19 pandemic. Our strategy also demonstrated the feasibility of a rapid whole-genome sequencing framework in the healthcare setting, paving the way for further applications of rapid sequencing technologies in the clinical diagnostics.</p>
</sec>
<sec sec-type="data-availability" id="s5">
<title>Data Availability Statement</title>
<p>The original contributions presented in the study are included in the article/<xref ref-type="sec" rid="s9">Supplementary Material</xref>, further inquiries can be directed to the corresponding author/s.</p>
</sec>
<sec id="s6">
<title>Author Contributions</title>
<p>HY, KK, and CS planned and designed the project. HY developed a CalmBelt web application and performed all computational analysis with CS&#x00027;s supervision. NA and ST planned and performed wet-lab experiments with KK&#x00027;s supervision. NN provides feedback on computational and wet-lab experiments, as well as manuscripts. HY, KK, and CS wrote the manuscript with input from all authors. All authors contributed to the article and approved the submitted version.</p>
</sec>
<sec sec-type="funding-information" id="s7">
<title>Funding</title>
<p>This work was supported by funding from Chiang Mai University, SingHealth Duke-NUS Academic Medicine [Grant Number AM/CSP012/2020 (SRDUKAMC2012)] and A<sup>&#x0002A;</sup>STAR. KK was supported by the Singapore National Medical Research Council research training fellowship.</p>
</sec>
<sec sec-type="COI-statement" id="conf1">
<title>Conflict of Interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s8">
<title>Publisher&#x00027;s Note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec> 
</body>
<back>
<ack>
<p>We thank Dr. Kern Rei Chng for valuable insights and comments on the study and manuscript.</p>
</ack>
<sec sec-type="supplementary-material" id="s9">
<title>Supplementary Material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fmed.2021.790662/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fmed.2021.790662/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Table_1.XLSX" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>Supplementary File 1</label>
<caption><p>Acknowledgment table SARS-CoV-2 genomes collected in Singapore from GISAID (30 June 2021).</p></caption> 
</supplementary-material>
<supplementary-material xlink:href="Table_2.XLSX" id="SM2" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>Supplementary File 2</label>
<caption><p>Detail of 99 de-identified positive cases collected in Singapore General Hospital (January to August 2020).</p></caption> 
</supplementary-material>
<supplementary-material xlink:href="Data_Sheet_2.PDF" id="SM3" mimetype="application/pdf" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>Supplementary File 3</label>
<caption><p>Mutations for GISAID clades.</p></caption> 
</supplementary-material>
<supplementary-material xlink:href="Data_Sheet_1.PDF" id="SM4" mimetype="application/pdf" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>Supplementary Figure 1</label>
<caption><p>Increasing mutation rate of 3,406 genomes from Singapore downloaded from GISAID (Jan 2020&#x02013;June 2021). Y-axis represents an average number of mutations per week.</p></caption> 
</supplementary-material>
<supplementary-material xlink:href="Data_Sheet_1.PDF" id="SM5" mimetype="application/pdf" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>Supplementary Figure 2</label>
<caption><p>In addition to a similarity tree and a list of mutations in <xref ref-type="fig" rid="F1">Figure 1B</xref>, CalmBelt provides a phylogenetic tree (<bold>A</bold>; IQTREE2 used in Pangolin), a transmission tree (<bold>B</bold>; TreeTime used in Nextstrain), and a heatmap <bold>(C)</bold> capturing the number of different nucleotides between every pair of genomes.</p></caption> 
</supplementary-material>
<supplementary-material xlink:href="Data_Sheet_1.PDF" id="SM6" mimetype="application/pdf" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>Supplementary Figure 3</label>
<caption><p>Time-series plots show the trend of GISAID clades across continents. We note that the trends might be slightly different from Nextstrain due to the subsampling process used in Nextstrain.</p></caption> 
</supplementary-material>
<supplementary-material xlink:href="Data_Sheet_1.PDF" id="SM7" mimetype="application/pdf" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>Supplementary Figure 4</label>
<caption><p>Time-series plots show the trend of PANGO lineage (based on the greek alphabets) across continents.</p></caption> 
</supplementary-material>
<supplementary-material xlink:href="Data_Sheet_1.PDF" id="SM8" mimetype="application/pdf" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>Supplementary Figure 5</label>
<caption><p>Statistics of B.6.6 lineage across different countries between March to May 2020.</p></caption> 
</supplementary-material>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<label>1.</label>
<citation citation-type="web"><person-group person-group-type="author"><collab>COVID Live Update: 161 080 581 Cases and 3 345 018 Deaths From the Coronavirus - Worldometer</collab></person-group>. Available online at: <ext-link ext-link-type="uri" xlink:href="https://www.worldometers.info/coronavirus/">https://www.worldometers.info/coronavirus/</ext-link> (accessed May 13, 2021).</citation>
</ref>
<ref id="B2">
<label>2.</label>
<citation citation-type="web"><source>WHO Coronavirus (COVID-19) Dashboard</source>. Available online at: <ext-link ext-link-type="uri" xlink:href="https://covid19.who.int/">https://covid19.who.int/</ext-link> (accessed July 17, 2021).</citation>
</ref>
<ref id="B3">
<label>3.</label>
<citation citation-type="web"><person-group person-group-type="author"><collab>MOH</collab></person-group>. Available online at: <ext-link ext-link-type="uri" xlink:href="https://www.moh.gov.sg/covid-19">https://www.moh.gov.sg/covid-19</ext-link> (accessed May 13, 2021).</citation>
</ref>
<ref id="B4">
<label>4.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lee</surname> <given-names>VJ</given-names></name> <name><surname>Chiew</surname> <given-names>CJ</given-names></name> <name><surname>Khong</surname> <given-names>WX</given-names></name></person-group>. <article-title>Interrupting transmission of COVID-19: lessons from containment efforts in Singapore</article-title>. <source>J Travel Med.</source> (<year>2020</year>) <volume>27</volume>:<fpage>taaa039</fpage>. <pub-id pub-id-type="doi">10.1093/jtm/taaa039</pub-id><pub-id pub-id-type="pmid">32167146</pub-id></citation></ref>
<ref id="B5">
<label>5.</label>
<citation citation-type="web"><source>Tracking SARS-CoV-2 Variants</source>. Available online at: <ext-link ext-link-type="uri" xlink:href="https://www.who.int/en/activities/tracking-SARS-CoV-2-variants/">https://www.who.int/en/activities/tracking-SARS-CoV-2-variants/</ext-link> (accessed July 17, 2021).</citation>
</ref>
<ref id="B6">
<label>6.</label>
<citation citation-type="web"><person-group person-group-type="author"><collab>Public Health England. Investigation of SARS-CoV-2 Variants of Concern: Technical Briefings.</collab></person-group> (<year>2020</year>). Available online at: <ext-link ext-link-type="uri" xlink:href="https://www.gov.uk/government/publications/investigation-of-novel-sars-cov-2-variant-variant-of-concern-20201201">https://www.gov.uk/government/publications/investigation-of-novel-sars-cov-2-variant-variant-of-concern-20201201</ext-link> (accessed July 17, 2021).</citation>
</ref>
<ref id="B7">
<label>7.</label>
<citation citation-type="web"><person-group person-group-type="author"><collab>CDC. SARS-CoV-2 Variant Classifications and Definitions.</collab></person-group> (<year>2021</year>). Available online at: <ext-link ext-link-type="uri" xlink:href="https://www.cdc.gov/coronavirus/2019-ncov/variants/variant-info.html">https://www.cdc.gov/coronavirus/2019-ncov/variants/variant-info.html</ext-link> (accessed July 17, 2021).</citation>
</ref>
<ref id="B8">
<label>8.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hadfield</surname> <given-names>J</given-names></name> <name><surname>Megill</surname> <given-names>C</given-names></name> <name><surname>Bell</surname> <given-names>SM</given-names></name> <name><surname>Huddleston</surname> <given-names>J</given-names></name> <name><surname>Potter</surname> <given-names>B</given-names></name> <name><surname>Callender</surname> <given-names>C</given-names></name> <etal/></person-group>. <article-title>Nextstrain: real-time tracking of pathogen evolution</article-title>. <source>Bioinformatics.</source> (<year>2018</year>) <volume>34</volume>:<fpage>4121</fpage>&#x02013;<lpage>3</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/bty407</pub-id><pub-id pub-id-type="pmid">29790939</pub-id></citation></ref>
<ref id="B9">
<label>9.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shu</surname> <given-names>Y</given-names></name> <name><surname>McCauley</surname> <given-names>J</given-names></name></person-group>. <article-title>GISAID: global initiative on sharing all influenza data &#x02013; from vision to reality</article-title>. <source>Euro Surveill.</source> (<year>2017</year>) <volume>22</volume>:<fpage>30494</fpage>. <pub-id pub-id-type="doi">10.2807/1560-7917.ES.2017.22.13.30494</pub-id><pub-id pub-id-type="pmid">28382917</pub-id></citation></ref>
<ref id="B10">
<label>10.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bull</surname> <given-names>RA</given-names></name> <name><surname>Adikari</surname> <given-names>TN</given-names></name> <name><surname>Ferguson</surname> <given-names>JM</given-names></name> <name><surname>Hammond</surname> <given-names>JM</given-names></name> <name><surname>Stevanovski</surname> <given-names>I</given-names></name> <name><surname>Beukers</surname> <given-names>AG</given-names></name> <etal/></person-group>. <article-title>Analytical validity of nanopore sequencing for rapid SARS-CoV-2 genome analysis</article-title>. <source>Nat Commun.</source> (<year>2020</year>) <volume>11</volume>:<fpage>6272</fpage>. <pub-id pub-id-type="doi">10.1038/s41467-020-20075-6</pub-id><pub-id pub-id-type="pmid">33298935</pub-id></citation></ref>
<ref id="B11">
<label>11.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rambaut</surname> <given-names>A</given-names></name> <name><surname>Holmes</surname> <given-names>EC</given-names></name> <name><surname>O&#x00027;Toole</surname> <given-names>&#x000C1;</given-names></name> <name><surname>Hill</surname> <given-names>V</given-names></name> <name><surname>McCrone</surname> <given-names>JT</given-names></name> <name><surname>Ruis</surname> <given-names>C</given-names></name> <etal/></person-group>. <article-title>A dynamic nomenclature proposal for SARS-CoV-2 lineages to assist genomic epidemiology</article-title>. <source>Nat Microbiol.</source> (<year>2020</year>) <volume>5</volume>:<fpage>1403</fpage>&#x02013;<lpage>7</lpage>. <pub-id pub-id-type="doi">10.1038/s41564-020-0770-5</pub-id><pub-id pub-id-type="pmid">33514928</pub-id></citation></ref>
<ref id="B12">
<label>12.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname> <given-names>T</given-names></name> <name><surname>Wu</surname> <given-names>Q</given-names></name> <name><surname>Zhang</surname> <given-names>Z</given-names></name></person-group>. <article-title>Probable pangolin origin of SARS-CoV-2 associated with the COVID-19 outbreak</article-title>. <source>Curr Biol.</source> (<year>2020</year>) <volume>30</volume>:<fpage>1578</fpage>. <pub-id pub-id-type="doi">10.1016/j.cub.2020.03.063</pub-id><pub-id pub-id-type="pmid">32315626</pub-id></citation></ref>
<ref id="B13">
<label>13.</label>
<citation citation-type="web"><source>Lineage, B,.1.617.2</source>. Available online at: <ext-link ext-link-type="uri" xlink:href="https://cov-lineages.org/global_report_B.1.617.2.html">https://cov-lineages.org/global_report_B.1.617.2.html</ext-link> (accessed May 24, 2021).</citation>
</ref>
<ref id="B14">
<label>14.</label>
<citation citation-type="web"><person-group person-group-type="author"><collab>pangoLEARN-training</collab></person-group>. <article-title>Github</article-title>. Available online at: <ext-link ext-link-type="uri" xlink:href="https://github.com/cov-lineages/pangoLEARN-training">https://github.com/cov-lineages/pangoLEARN-training</ext-link> (accessed July 17, 2021).</citation>
</ref>
<ref id="B15">
<label>15.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Johnson</surname> <given-names>M</given-names></name> <name><surname>Zaretskaya</surname> <given-names>I</given-names></name> <name><surname>Raytselis</surname> <given-names>Y</given-names></name> <name><surname>Merezhuk</surname> <given-names>Y</given-names></name> <name><surname>McGinnis</surname> <given-names>S</given-names></name> <name><surname>Madden</surname> <given-names>TL</given-names></name></person-group>. <article-title>NCBI BLAST: a better web interface</article-title>. <source>Nucleic Acids Res.</source> (<year>2008</year>) <volume>36</volume>:<fpage>W5</fpage>&#x02013;<lpage>9</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkn201</pub-id><pub-id pub-id-type="pmid">18440982</pub-id></citation></ref>
<ref id="B16">
<label>16.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Katoh</surname> <given-names>K</given-names></name> <name><surname>Standley</surname> <given-names>DM</given-names></name></person-group>. <article-title>MAFFT multiple sequence alignment software version 7: improvements in performance and usability</article-title>. <source>Mol Biol Evol.</source> (<year>2013</year>) <volume>30</volume>:<fpage>772</fpage>&#x02013;<lpage>80</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/mst010</pub-id><pub-id pub-id-type="pmid">23329690</pub-id></citation></ref>
<ref id="B17">
<label>17.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Minh</surname> <given-names>BQ</given-names></name> <name><surname>Schmidt</surname> <given-names>HA</given-names></name> <name><surname>Chernomor</surname> <given-names>O</given-names></name> <name><surname>Schrempf</surname> <given-names>D</given-names></name> <name><surname>Woodhams</surname> <given-names>MD</given-names></name> <name><surname>von Haeseler</surname> <given-names>A</given-names></name> <etal/></person-group>. <article-title>IQ-TREE 2: new models and efficient methods for phylogenetic inference in the genomic era</article-title>. <source>Mol Biol Evol.</source> (<year>2020</year>) <volume>37</volume>:<fpage>1530</fpage>&#x02013;<lpage>4</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/msaa015</pub-id><pub-id pub-id-type="pmid">32556291</pub-id></citation></ref>
<ref id="B18">
<label>18.</label>
<citation citation-type="web"><person-group person-group-type="author"><collab>CDC. Performing Broad-Based Testing for SARS-CoV-2 in Congregate Correctional, Detention, and Homeless Service Settings.</collab></person-group> (<year>2021</year>). Available online at: <ext-link ext-link-type="uri" xlink:href="https://www.cdc.gov/coronavirus/2019-ncov/hcp/broad-based-testing.html">https://www.cdc.gov/coronavirus/2019-ncov/hcp/broad-based-testing.html</ext-link> (accessed October 30, 2021).</citation>
</ref>
<ref id="B19">
<label>19.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Welch</surname> <given-names>SR</given-names></name> <name><surname>Davies</surname> <given-names>KA</given-names></name> <name><surname>Buczkowski</surname> <given-names>H</given-names></name> <name><surname>Hettiarachchi</surname> <given-names>N</given-names></name> <name><surname>Green</surname> <given-names>N</given-names></name> <name><surname>Arnold</surname> <given-names>U</given-names></name> <etal/></person-group>. <article-title>Analysis of inactivation of SARS-CoV-2 by specimen transport media, nucleic acid extraction reagents, detergents, and fixatives</article-title>. <source>J Clin Microbiol.</source> (<year>2020</year>) <volume>58</volume>:<fpage>e01713</fpage>&#x02013;<lpage>20</lpage>. <pub-id pub-id-type="doi">10.1128/JCM.01713-20</pub-id><pub-id pub-id-type="pmid">32839250</pub-id></citation></ref>
<ref id="B20">
<label>20.</label>
<citation citation-type="web"><person-group person-group-type="author"><collab>Public Health England. SARS-CoV-2 Inactivation Testing: Interim Report.</collab></person-group> (<year>2020</year>). Available online at: <ext-link ext-link-type="uri" xlink:href="https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/898620/HCM-CoV2-015-v2_cobas_Omni_LYS_reagent_TCF.pdf">https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/898620/HCM-CoV2-015-v2_cobas_Omni_LYS_reagent_TCF.pdf</ext-link> (accessed June 30, 2021).</citation>
</ref>
<ref id="B21">
<label>21.</label>
<citation citation-type="web"><source>Artic Network</source>. Available online at: <ext-link ext-link-type="uri" xlink:href="https://artic.network/ncov-2019">https://artic.network/ncov-2019</ext-link> (accessed May 13, 2021).</citation>
</ref>
<ref id="B22">
<label>22.</label>
<citation citation-type="web"><person-group person-group-type="author"><collab>rampart</collab></person-group>. <article-title>Github</article-title>. Available online at: <ext-link ext-link-type="uri" xlink:href="https://github.com/artic-network/rampart">https://github.com/artic-network/rampart</ext-link> (accessed May 13, 2021).</citation>
</ref>
<ref id="B23">
<label>23.</label>
<citation citation-type="web"><source>NCBI SARS-CoV-2 Resources</source>. Available online at: <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/sars-cov-2/">https://www.ncbi.nlm.nih.gov/sars-cov-2/</ext-link> (accessed May 16, 2021).</citation>
</ref>
<ref id="B24">
<label>24.</label>
<citation citation-type="web"><person-group person-group-type="author"><name><surname>van der Maaten</surname> <given-names>L</given-names></name></person-group>. <article-title>Visualizing Data using t-SNE</article-title>. (<year>2008</year>). Available online at: <ext-link ext-link-type="uri" xlink:href="https://www.jmlr.org/papers/volume9/vandermaaten08a/vandermaaten08a.pdf?fbclid=IwA">https://www.jmlr.org/papers/volume9/vandermaaten08a/vandermaaten08a.pdf?fbclid=IwA</ext-link> (accessed July 25, 2021).</citation>
</ref>
<ref id="B25">
<label>25.</label>
<citation citation-type="web"><person-group person-group-type="author"><collab>GISAID - Clade and Lineage Nomenclature Aids in Genomic Epidemiology of Active hCoV-19 Viruses</collab></person-group>. Available online at: <ext-link ext-link-type="uri" xlink:href="https://www.gisaid.org/references/statements-clarifications/clade-and-lineage-nomenclature-aids-in-genomic-epidemiology-of-active-hcov-19-viruses/">https://www.gisaid.org/references/statements-clarifications/clade-and-lineage-nomenclature-aids-in-genomic-epidemiology-of-active-hcov-19-viruses/</ext-link> (accessed May 13, 2021).</citation>
</ref>
<ref id="B26">
<label>26.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sagulenko</surname> <given-names>P</given-names></name> <name><surname>Puller</surname> <given-names>V</given-names></name> <name><surname>Neher</surname> <given-names>RA</given-names></name></person-group>. <article-title>TreeTime: maximum-likelihood phylodynamic analysis</article-title>. <source>Virus Evol.</source> (<year>2018</year>) <volume>4</volume>:<fpage>vex042</fpage>. <pub-id pub-id-type="doi">10.1093/ve/vex042</pub-id><pub-id pub-id-type="pmid">29340210</pub-id></citation></ref>
<ref id="B27">
<label>27.</label>
<citation citation-type="web"><source>PANGO n-names>Lineages</source>. Available online at: <ext-link ext-link-type="uri" xlink:href="https://cov-lineages.org/pangolin_docs/pangolearn.html">https://cov-lineages.org/pangolin_docs/pangolearn.html</ext-link> (accessed May 13, 2021).</citation>
</ref>
<ref id="B28">
<label>28.</label>
<citation citation-type="web"><person-group person-group-type="author"><collab>How to Interpret the Phylogenetic Trees &#x02014; Nextstrain Documentation</collab></person-group>. Available online at: <ext-link ext-link-type="uri" xlink:href="https://docs.nextstrain.org/en/latest/learn/interpret/how-to-read-a-tree.html">https://docs.nextstrain.org/en/latest/learn/interpret/how-to-read-a-tree.html</ext-link> (accessed September 12, 2021).</citation>
</ref>
<ref id="B29">
<label>29.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Koh</surname> <given-names>D</given-names></name></person-group>. <article-title>Migrant workers and COVID-19</article-title>. <source>Occup Environ Med.</source> (<year>2020</year>) <volume>77</volume>:<fpage>634</fpage>&#x02013;<lpage>6</lpage>. <pub-id pub-id-type="doi">10.1136/oemed-2020-106626</pub-id><pub-id pub-id-type="pmid">32513832</pub-id></citation></ref>
<ref id="B30">
<label>30.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Korber</surname> <given-names>B</given-names></name> <name><surname>Fischer</surname> <given-names>WM</given-names></name> <name><surname>Gnanakaran</surname> <given-names>S</given-names></name> <name><surname>Yoon</surname> <given-names>H</given-names></name> <name><surname>Theiler</surname> <given-names>J</given-names></name> <name><surname>Abfalterer</surname> <given-names>W</given-names></name> <etal/></person-group>. <article-title>Tracking changes in SARS-CoV-2 spike: evidence that D614G increases infectivity of the COVID-19 virus</article-title>. <source>Cell.</source> (<year>2020</year>) <volume>182</volume>:<fpage>812</fpage>&#x02013;<lpage>27</lpage>.e19. <pub-id pub-id-type="doi">10.1016/j.cell.2020.06.043</pub-id><pub-id pub-id-type="pmid">32697968</pub-id></citation></ref>
<ref id="B31">
<label>31.</label>
<citation citation-type="web"><person-group person-group-type="author"><collab>Center for Devices Radiological Health. Genetic Variants May Lead to False Negatives With SARS-CoV-2 Molecular.</collab></person-group> (<year>2021</year>). Available online at: <ext-link ext-link-type="uri" xlink:href="https://www.fda.gov/medical-devices/letters-health-care-providers/genetic-variants-sars-cov-2-may-lead-false-negative-results-molecular-tests-detection-sars-cov-2">https://www.fda.gov/medical-devices/letters-health-care-providers/genetic-variants-sars-cov-2-may-lead-false-negative-results-molecular-tests-detection-sars-cov-2</ext-link> (accessed May 17, 2021).</citation>
</ref>
<ref id="B32">
<label>32.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lu</surname> <given-names>X</given-names></name> <name><surname>Wang</surname> <given-names>L</given-names></name> <name><surname>Sakthivel</surname> <given-names>SK</given-names></name> <name><surname>Whitaker</surname> <given-names>B</given-names></name> <name><surname>Murray</surname> <given-names>J</given-names></name> <name><surname>Kamili</surname> <given-names>S</given-names></name> <etal/></person-group>. <article-title>US CDC real-time reverse transcription PCR panel for detection of severe acute respiratory syndrome coronavirus 2</article-title>. <source>Emerg Infect Dis.</source> (<year>2020</year>) <volume>26</volume>:<fpage>1654</fpage>&#x02013;<lpage>665</lpage>. <pub-id pub-id-type="doi">10.3201/eid2608.201246</pub-id><pub-id pub-id-type="pmid">32396505</pub-id></citation></ref>
<ref id="B33">
<label>33.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Deng</surname> <given-names>X</given-names></name> <name><surname>Garcia-Knight</surname> <given-names>MA</given-names></name> <name><surname>Khalid</surname> <given-names>MM</given-names></name> <name><surname>Servellita</surname> <given-names>V</given-names></name> <name><surname>Wang</surname> <given-names>C</given-names></name> <name><surname>Morris</surname> <given-names>MK</given-names></name> <etal/></person-group>. <article-title>Transmission, infectivity, and antibody neutralization of an emerging SARS-CoV-2 variant in California carrying a L452R spike protein mutation</article-title>. <source>medRxiv [Preprints]</source>. (<year>2021</year>). <pub-id pub-id-type="doi">10.1101/2021.03.07.21252647</pub-id><pub-id pub-id-type="pmid">33758899</pub-id></citation></ref>
<ref id="B34">
<label>34.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Saito</surname> <given-names>A</given-names></name> <name><surname>Nasser</surname> <given-names>H</given-names></name> <name><surname>Uriu</surname> <given-names>K</given-names></name> <name><surname>Kosugi</surname> <given-names>Y</given-names></name> <name><surname>Irie</surname> <given-names>T</given-names></name> <name><surname>Shirakawa</surname> <given-names>K</given-names></name></person-group>. <article-title>SARS-CoV-2 spike P681R mutation enhances and accelerates viral fusion</article-title>. <source>bioRxiv [Preprints].</source> (<year>2021</year>). <pub-id pub-id-type="doi">10.1101/2021.06.17.448820</pub-id></citation>
</ref>
<ref id="B35">
<label>35.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cherian</surname> <given-names>S</given-names></name> <name><surname>Potdar</surname> <given-names>V</given-names></name> <name><surname>Jadhav</surname> <given-names>S</given-names></name> <name><surname>Yadav</surname> <given-names>P</given-names></name> <name><surname>Gupta</surname> <given-names>N</given-names></name> <name><surname>Das</surname> <given-names>M</given-names></name> <etal/></person-group>. <article-title>Convergent evolution of SARS-CoV-2 spike mutations, L452R, E484Q and P681R, in the second wave of COVID-19 in Maharashtra, India</article-title>. <source>bioRxiv [Preprints].</source> (<year>2021</year>). <pub-id pub-id-type="doi">10.1101/2021.04.22.440932</pub-id></citation>
</ref>
<ref id="B36">
<label>36.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ziegler</surname> <given-names>K</given-names></name> <name><surname>Steininger</surname> <given-names>P</given-names></name> <name><surname>Ziegler</surname> <given-names>R</given-names></name> <name><surname>Steinmann</surname> <given-names>J</given-names></name> <name><surname>Korn</surname> <given-names>K</given-names></name> <name><surname>Ensser</surname> <given-names>A</given-names></name></person-group>. <article-title>SARS-CoV-2 samples may escape detection because of a single point mutation in the N gene</article-title>. <source>Euro Surveill.</source> (<year>2020</year>) <volume>25</volume>:<fpage>2001650</fpage>. <pub-id pub-id-type="doi">10.2807/1560-7917.ES.2020.25.39.2001650</pub-id><pub-id pub-id-type="pmid">33006300</pub-id></citation></ref>
<ref id="B37">
<label>37.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gonz&#x000E1;lez-Recio</surname> <given-names>O</given-names></name> <name><surname>Guti&#x000E9;rrez-Rivas</surname> <given-names>M</given-names></name> <name><surname>Peir&#x000F3;-Pastor</surname> <given-names>R</given-names></name> <name><surname>Aguilera-Sep&#x000FA;lveda</surname> <given-names>P</given-names></name> <name><surname>Cano-G&#x000F3;mez</surname> <given-names>C</given-names></name> <name><surname>Jim&#x000E9;nez-Clavero</surname> <given-names>M&#x000C1;</given-names></name> <etal/></person-group>. <article-title>Sequencing of SARS-CoV-2 genome using different nanopore chemistries</article-title>. <source>Appl Microbiol Biotechnol.</source> (<year>2021</year>) <volume>105</volume>:<fpage>3225</fpage>&#x02013;<lpage>34</lpage>. <pub-id pub-id-type="doi">10.1007/s00253-021-11250-w</pub-id><pub-id pub-id-type="pmid">33792750</pub-id></citation></ref>
<ref id="B38">
<label>38.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tyson</surname> <given-names>JR</given-names></name> <name><surname>James</surname> <given-names>P</given-names></name> <name><surname>Stoddart</surname> <given-names>D</given-names></name> <name><surname>Sparks</surname> <given-names>N</given-names></name> <name><surname>Wickenhagen</surname> <given-names>A</given-names></name> <name><surname>Hall</surname> <given-names>G</given-names></name> <etal/></person-group>. <article-title>Improvements to the ARTIC multiplex PCR method for SARS-CoV-2 genome sequencing using nanopore</article-title>. <source>bioRxiv [Preprints]</source>. (<year>2020</year>). <pub-id pub-id-type="doi">10.1101/2020.09.04.283077</pub-id><pub-id pub-id-type="pmid">32908977</pub-id></citation></ref>
<ref id="B39">
<label>39.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wu</surname> <given-names>A</given-names></name> <name><surname>Wang</surname> <given-names>L</given-names></name> <name><surname>Zhou</surname> <given-names>H-Y</given-names></name> <name><surname>Ji</surname> <given-names>C-Y</given-names></name> <name><surname>Xia</surname> <given-names>SZ</given-names></name> <name><surname>Cao</surname> <given-names>Y</given-names></name> <etal/></person-group>. <article-title>One year of SARS-CoV-2 evolution</article-title>. <source>Cell Host Microbe.</source> (<year>2021</year>) <volume>29</volume>:<fpage>503</fpage>&#x02013;<lpage>7</lpage>. <pub-id pub-id-type="doi">10.1016/j.chom.2021.02.017</pub-id><pub-id pub-id-type="pmid">33676588</pub-id></citation></ref>
<ref id="B40">
<label>40.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Plante</surname> <given-names>JA</given-names></name> <name><surname>Mitchell</surname> <given-names>BM</given-names></name> <name><surname>Plante</surname> <given-names>KS</given-names></name> <name><surname>Debbink</surname> <given-names>K</given-names></name> <name><surname>Weaver</surname> <given-names>SC</given-names></name> <name><surname>Menachery</surname> <given-names>VD</given-names></name></person-group>. <article-title>The variant gambit: COVID-19&#x00027;s next move</article-title>. <source>Cell Host &#x00026; Microbe.</source> (<year>2021</year>) <volume>29</volume>:<fpage>508</fpage>&#x02013;<lpage>15</lpage>. <pub-id pub-id-type="doi">10.1016/j.chom.2021.02.020</pub-id><pub-id pub-id-type="pmid">33789086</pub-id></citation></ref>
<ref id="B41">
<label>41.</label>
<citation citation-type="web"><person-group person-group-type="author"><name><surname>Hodcroft</surname> <given-names>E</given-names></name></person-group>. <article-title>CoVariants</article-title>. <source>CoVariants</source> Available online at: <ext-link ext-link-type="uri" xlink:href="https://covariants.org/">https://covariants.org/</ext-link> (accessed July 25, 2021). </citation>
</ref>
</ref-list> 
</back>
</article>