<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Genet.</journal-id>
<journal-title>Frontiers in Genetics</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Genet.</abbrev-journal-title>
<issn pub-type="epub">1664-8021</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">1352443</article-id>
<article-id pub-id-type="doi">10.3389/fgene.2024.1352443</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Genetics</subject>
<subj-group>
<subject>Technology and Code</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>SVhawkeye: an ultra-fast software for user-friendly visualization of targeted structural fragments from BAM files</article-title>
<alt-title alt-title-type="left-running-head">Xiao et al.</alt-title>
<alt-title alt-title-type="right-running-head">
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3389/fgene.2024.1352443">10.3389/fgene.2024.1352443</ext-link>
</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Xiao</surname>
<given-names>Yuhui</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/633609/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Yu</surname>
<given-names>Tao</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2674827/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Liang</surname>
<given-names>Fan</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/828194/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Hou</surname>
<given-names>Tingping</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2077052/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>The State Key Laboratory of Refractories and Metallurgy</institution>, <institution>Joint International Research Laboratory of Refractories and Metallurgy</institution>, <institution>Hubei Province Key Laboratory of Systems Science in Metallurgical Process</institution>, <institution>International Research Institute for Steel Technology</institution>, <institution>Collaborative Innovation Center for Advanced Steels</institution>, <institution>Wuhan University of Science and Technology</institution>, <addr-line>Wuhan</addr-line>, <country>China</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>School of Optoelectronic Materials and Technology</institution>, <institution>Jianghan University</institution>, <addr-line>Wuhan</addr-line>, <country>China</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>GrandOmics Biosciences</institution>, <addr-line>Wuhan</addr-line>, <country>China</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1103229/overview">Xavier Sol&#xe9;</ext-link>, Hospital Clinic of Barcelona, Spain</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1563767/overview">Giltae Song</ext-link>, Pusan National University, Republic of Korea</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/760272/overview">Sheng Wang</ext-link>, University of California, San Francisco, United States</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Tao Yu, <email>tyu@jhun.edu.cn</email>; Tingping Hou, <email>houtingping@wust.edu.cn</email>
</corresp>
</author-notes>
<pub-date pub-type="epub">
<day>24</day>
<month>04</month>
<year>2024</year>
</pub-date>
<pub-date pub-type="collection">
<year>2024</year>
</pub-date>
<volume>15</volume>
<elocation-id>1352443</elocation-id>
<history>
<date date-type="received">
<day>08</day>
<month>12</month>
<year>2023</year>
</date>
<date date-type="accepted">
<day>08</day>
<month>04</month>
<year>2024</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2024 Xiao, Yu, Liang and Hou.</copyright-statement>
<copyright-year>2024</copyright-year>
<copyright-holder>Xiao, Yu, Liang and Hou</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>SVhawkeye is a novel visualization software created to rapidly extract essential structural information from third-generation sequencing data, such as data generated by PacBio or Oxford Nanopore Technologies. Its primary focus is on visualizing various structural variations commonly encountered in whole-genome sequencing (WGS) experiments, including deletions, insertions, duplications, inversions, and translocations. Additionally, SVhawkeye has the capability to display isoform structures obtained from iso-seq data and provides interval depth visualization for deducing local copy number variation (CNV). One noteworthy feature of SVhawkeye is its capacity to genotype structural variations, a critical function that enhances the accuracy of structural variant genotyping. SVhawkeye is an open-source software developed using Python and R languages, and it is freely accessible on GitHub (<ext-link ext-link-type="uri" xlink:href="https://github.com/yywan0913/SVhawkeye">https://github.com/yywan0913/SVhawkeye</ext-link>).</p>
</abstract>
<kwd-group>
<kwd>structural variations</kwd>
<kwd>data visualization</kwd>
<kwd>genotyping</kwd>
<kwd>third-generation sequencing</kwd>
<kwd>whole-genome sequencing</kwd>
<kwd>python and R software</kwd>
</kwd-group>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Computational Genomics</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1">
<title>Introduction</title>
<p>The genetic variations in the human genome encompass a variety of categories, including numerical abnormalities of chromosomes, structural variation (SV) in chromosomes, copy number variation (CNV), single nucleotide variation (SNV), and insertion-deletion mutations (indels). Numerical abnormalities of chromosomes can result in conditions like trisomy syndrome, which can be identified through methods such as karyotyping or analyzing the depth distribution of all chromosomes (<xref ref-type="bibr" rid="B37">Santoro et al., 2020</xref>; <xref ref-type="bibr" rid="B38">Santoro et al., 2022</xref>).</p>
<p>SVs denote significant genomic alterations that typically span at least 50 base pairs (<xref ref-type="bibr" rid="B11">Duan et al., 2022</xref>). These genomic variants include inversions, balanced translocations, and genomic imbalances, which involve duplications, insertions, and deletions collectively referred to as DNA gains, losses, or rearrangements (<xref ref-type="bibr" rid="B43">Sudmant et al., 2015</xref>; <xref ref-type="bibr" rid="B40">Sedlazeck et al., 2018a</xref>). Whole-genome sequencing (WGS) from next-generation sequencing (NGS) or third-generation sequencing (TGS) data can detect these variants.</p>
<p>SVs are not only play an important role in gene expression (<xref ref-type="bibr" rid="B5">Chain and Feulner, 2014</xref>; <xref ref-type="bibr" rid="B6">Chiang et al., 2017</xref>) and phenotypic diversity (<xref ref-type="bibr" rid="B25">MacArthur et al., 2007</xref>; <xref ref-type="bibr" rid="B32">Perry et al., 2007</xref>; <xref ref-type="bibr" rid="B18">Jarvis et al., 2012</xref>; <xref ref-type="bibr" rid="B20">Kamberov et al., 2013</xref>). Numerous complex hereditary diseases, including autism (<xref ref-type="bibr" rid="B15">Hoischen et al., 2014</xref>; <xref ref-type="bibr" rid="B9">Dennis et al., 2017</xref>), cancer (<xref ref-type="bibr" rid="B45">Vogelstein et al., 2013</xref>; <xref ref-type="bibr" rid="B49">Zack et al., 2013</xref>), Alzheimer&#x2019;s disease (<xref ref-type="bibr" rid="B36">Roses, 2016</xref>), and schizophrenia (<xref ref-type="bibr" rid="B22">Klar, 2004</xref>; <xref ref-type="bibr" rid="B26">Marshall et al., 2017</xref>), are known to originate from structural variations in the genome. Examples of such variations encompass translocations and large deletions, significantly contributing to both cancer and hereditary diseases (<xref ref-type="bibr" rid="B2">Abeysinghe et al., 2006</xref>). Gene inversions also play a role in certain conditions, such as Hemophilia A (<xref ref-type="bibr" rid="B8">Dai et al., 2021</xref>). Moreover, Short Tandem Repeats (STRs) (<xref ref-type="bibr" rid="B27">Masters et al., 2001</xref>) and Variable Number of Tandem Repeats (VNTRs) (<xref ref-type="bibr" rid="B3">Bakhtiari et al., 2021</xref>), specific types of structural variations, have been extensively studied in connection with repeat expansions. For instance, ATTCC repeat expansions have been associated with Parkinson&#x2019;s disease (<xref ref-type="bibr" rid="B39">Sch&#xfc;le et al., 2017</xref>), and CAG expansions have been linked to Huntington&#x2019;s disease (<xref ref-type="bibr" rid="B28">McColgan and Tabrizi, 2018</xref>).</p>
<p>SNVs are the most common type of genetic variation in humans (<xref ref-type="bibr" rid="B21">Katsonis et al., 2014</xref>). They play a crucial role in phenotypic diversity. RNA splicing (<xref ref-type="bibr" rid="B47">Wilkinson et al., 2020</xref>), a significant biological process in eukaryotic gene expression, is frequently detected through RNA-seq or isoform sequencing (iso-seq). This process results in the creation of numerous functional mRNAs carrying coding information. CNV (<xref ref-type="bibr" rid="B48">Wong et al., 2007</xref>; <xref ref-type="bibr" rid="B13">Fanciulli et al., 2010</xref>), on the other hand, refers to variations in the number of copies of specific DNA segments across different individuals&#x2019; genomes, resulting from duplications, deletions, or other alterations, often indicated by changes in read depth in WGS or whole exome sequencing (WES).</p>
<p>To effectively detect SVs from long reads, numerous software packages have been developed using genomic sequence data. These tools, including sniffles (<xref ref-type="bibr" rid="B41">Sedlazeck et al., 2018b</xref>), cuteSV (<xref ref-type="bibr" rid="B19">Jiang et al., 2020</xref>), pbsv (<ext-link ext-link-type="uri" xlink:href="https://github.com/PacificBiosciences/pbsv">https://github.com/PacificBiosciences/pbsv</ext-link>), and svim (<xref ref-type="bibr" rid="B14">Heller and Vingron, 2019</xref>), provide valuable SV results but may still have limitations in accurately identifying specific target SVs. Detected SVs can contain inaccuracies or lack sufficient read support, requiring meticulous manual interpretation using Integrative Genomics Viewer (IGV) (<xref ref-type="bibr" rid="B35">Robinson et al., 2011</xref>; <xref ref-type="bibr" rid="B44">Thorvaldsdottir et al., 2013</xref>; <xref ref-type="bibr" rid="B34">Robinson et al., 2017</xref>; <xref ref-type="bibr" rid="B33">Robinson et al., 2020</xref>). This process is time-consuming and involves importing reference genomes and BAM files (<ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/sra/docs/submitformats/">https://www.ncbi.nlm.nih.gov/sra/docs/submitformats/</ext-link>), as well as constant manual adjustments to observe structure types and read mapping quality. Additionally, users may overlook SV types resulting from split-mapping.</p>
<p>Alternative tools such as bamsnap (<xref ref-type="bibr" rid="B23">Kwon et al., 2021</xref>) and svviz (<xref ref-type="bibr" rid="B42">Spies et al., 2015</xref>) provide automation, but are unable to handle long read data and can be slow (<xref ref-type="table" rid="T1">Table 1</xref>) and more detailed information may be needed to understand the presented SV structure (<xref ref-type="fig" rid="F2">Figure 2B</xref>, <xref ref-type="fig" rid="F5">Figure 5B</xref>). Samplot (<xref ref-type="bibr" rid="B4">Belyeu et al., 2021</xref>) offers a rapid overview of mutation structure but may obscure essential read information, making it difficult to discern precise genotyping details and missing nearby structural information. Even inaccurate SV length may occur (<xref ref-type="fig" rid="F3">Figure 3C</xref>).</p>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>Feature comparisons of currently available SV plot tools.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">Software</th>
<th align="center">Variation type</th>
<th align="center">Variation type judgment</th>
<th align="center">Input format</th>
<th align="center">Speed (second/sv)</th>
<th align="center">Visual information reading</th>
<th align="center">SV genotyping/recall</th>
<th align="center">Supports long reads</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">
<bold>SVhawkeye</bold>
</td>
<td align="center">Fullly support<xref ref-type="table-fn" rid="Tfn1">
<sup>a</sup>
</xref>
</td>
<td align="center">auto</td>
<td align="center">bam &#x002B; vcf/bed</td>
<td align="center">3.29</td>
<td align="center">obvious<xref ref-type="table-fn" rid="Tfn4">
<sup>d</sup>
</xref>
</td>
<td align="center">yes</td>
<td align="center">yes</td>
</tr>
<tr>
<td align="center">
<bold>Samplot</bold>
</td>
<td align="center">Part<xref ref-type="table-fn" rid="Tfn2">
<sup>b</sup>
</xref>
</td>
<td align="center">specify</td>
<td align="center">bam &#x002B; vcf/pos</td>
<td align="center">2.41</td>
<td align="center">deliberative<xref ref-type="table-fn" rid="Tfn5">
<sup>e</sup>
</xref>
</td>
<td align="center">no</td>
<td align="center">yes</td>
</tr>
<tr>
<td align="center">
<bold>IGV</bold>
</td>
<td align="center">&#x2014;</td>
<td align="center">no</td>
<td align="center">bam &#x002B; pos</td>
<td align="center">&#x2014;</td>
<td align="center">&#x2014;</td>
<td align="center">no</td>
<td align="center">yes</td>
</tr>
<tr>
<td align="center">
<bold>IGVScreenshot</bold>
</td>
<td align="center">&#x2014;</td>
<td align="center">no</td>
<td align="center">bam &#x002B; bed</td>
<td align="center">22.36</td>
<td align="center">complex<xref ref-type="table-fn" rid="Tfn6">
<sup>f</sup>
</xref>
</td>
<td align="center">no</td>
<td align="center">yes</td>
</tr>
<tr>
<td align="center">
<bold>Bamsnap</bold>
</td>
<td align="center">&#x2014;</td>
<td align="center">no</td>
<td align="center">bam &#x002B; vcf/bed/pos</td>
<td align="center">&#x2014;</td>
<td align="center">complex</td>
<td align="center">no</td>
<td align="center">no</td>
</tr>
<tr>
<td align="center">
<bold>Svviz2</bold>
</td>
<td align="center">part<xref ref-type="table-fn" rid="Tfn3">
<sup>c</sup>
</xref>
</td>
<td align="center">specify</td>
<td align="center">bam &#x002B; vcf/bcf</td>
<td align="center">31.03</td>
<td align="center">complex</td>
<td align="center">no</td>
<td align="center">no</td>
</tr>
<tr>
<td align="center">
<bold>Svviz</bold>
</td>
<td align="center">part<xref ref-type="table-fn" rid="Tfn3">
<sup>c</sup>
</xref>
</td>
<td align="center">specify</td>
<td align="center">bam &#x002B; pos</td>
<td align="center">35.55</td>
<td align="center">complex</td>
<td align="center">no</td>
<td align="center">no</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn id="Tfn1">
<label>
<sup>a</sup>
</label>
<p>DEL/INS/INV/DUP/TRA/SNV/InDel/CNV, e.g.</p>
</fn>
<fn id="Tfn2">
<label>
<sup>b</sup>
</label>
<p>DEL/INS/INV/DUP.</p>
</fn>
<fn id="Tfn3">
<label>
<sup>c</sup>
</label>
<p>DEL/INS/INV/TRA.</p>
</fn>
<fn id="Tfn4">
<label>
<sup>d</sup>
</label>
<p>Obvious: It is possible to simultaneously observe factors such as SV, type; SV, length, and SV, supported reads. (<xref ref-type="fig" rid="F2">Figure 2</xref>; <xref ref-type="fig" rid="F3">Figure 3</xref>; <xref ref-type="fig" rid="F4">Figure 4</xref>; <xref ref-type="fig" rid="F5">Figure 5</xref>; <xref ref-type="fig" rid="F6">Figure 6</xref>).</p>
</fn>
<fn id="Tfn5">
<label>
<sup>e</sup>
</label>
<p>deliberative: Missing partial information for SV, e.g., missing number of variant reads and even possible inaccurate variant length (<xref ref-type="fig" rid="F3">Figure 3</xref>).</p>
</fn>
<fn id="Tfn6">
<label>
<sup>f</sup>
</label>
<p>Complex: More information may be needed to confirm the displayed SV, type. (<xref ref-type="fig" rid="F2">Figure 2</xref>; <xref ref-type="fig" rid="F4">Figure 4</xref>; <xref ref-type="fig" rid="F5">Figure 5</xref>).</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>In this paper, we introduce SVhawkeye, a novel software that addresses these aforementioned shortcomings. SVhawkeye offers a comprehensive suite of detection and visualization tools for SV curation. It enables the rapid generation of multiple SV graphs from VCF files simultaneously. SVhawkeye meticulously reviews and interprets each read, highlighting those that support target SVs. It can help quickly screen for pathogenic variants in clinical samples detected through third-generation sequencing. Moreover, SVhawkeye has the capability to concurrently exhibit various samples, encompassing family and population samples. It also accommodates the visualization of other genomic structural types like SNVs, RNA splicing, and CNV.</p>
</sec>
<sec id="s2" sec-type="methods">
<title>Methods</title>
<p>SVhawkeye undergoes several pre-processing steps to prepare data for visualization (<xref ref-type="fig" rid="F1">Figure 1A</xref>).<list list-type="simple">
<list-item>
<p>Step 1) Quality Assessment: Initially, SVhawkeye assesses the validity and quality of mapped reads, filtering out reads with insufficient evidence, Factors considered include low quality scores (default: mean reads quality &#x2265; Q20), low sequence identity (default: mapping identity &#x2265;60%), and short mapping lengths (default: remove reads with mapping length less than 100&#xa0;bp).</p>
</list-item>
<list-item>
<p>Step 2) Breakpoint Identification: SVhawkeye identifies breakpoints for each read based on cigar-mapping and split-mapping, utilizing the pysam package (<ext-link ext-link-type="uri" xlink:href="https://pysam.readthedocs.io/en/stable/">https://pysam.readthedocs.io/en/stable/</ext-link>) to read the BAM file. The cigar information is utilized to identify possible deletions, insertions, and soft clipping events. Split-reads are employed to gather breakpoint data, serving as a foundation for interpreting the SV sequence.</p>
</list-item>
<list-item>
<p>Step 3) SV Type Interpretation: SVhawkeye interprets SV types using mapping coordinate information, amalgamating the breakpoint data from all reads and predicting SV characteristics through common SV types (<xref ref-type="bibr" rid="B1">Abel et al., 2020</xref>) and a well-designed algorithm. This relevant breakpoint information is subsequently recorded. In this step, all reads are recorded after comparison with the reference in various types, which can be reference reads, deletions, insertions, duplications, inversions or translocation reads, along with the corresponding breakpoint information.</p>
</list-item>
<list-item>
<p>Step 4) Reads Rearrangement and Clustering: To visualize SV structures with significant intervals, SVhawkeye utilizes a greedy non-overlapping interval clustering algorithm (<ext-link ext-link-type="uri" xlink:href="https://labuladong.gitbook.io/algo-en/i.-dynamic-programming/intervalscheduling">https://labuladong.gitbook.io/algo-en/i.-dynamic-programming/intervalscheduling</ext-link>). This algorithm automatically arranges and assigns reads to each row in the graph, ensuring a visually appealing representation of SVs based on the previously acquired breakpoint information. Finally, plot these arranged coordinate information using the R language.</p>
</list-item>
<list-item>
<p>Step 5) SV Genotyping: SVhawkeye ascertains SV genotypes by scrutinizing the breakpoint information of reads that corroborate the specific SV within the interval relative to the target SV interval. This procedure entails excluding reads with coverage below 0.5 and breakpoint position disparities surpassing 1000, then removing reads with effective comparison length less than 100bp in this region. After reordering the reads in the step 4, the depth value also becomes more reasonable. Following this, SVhawkeye consolidates and computes the allele frequency (AF) value. A genotype of 0/1 is assigned when the AF value exceeds 0.3, while it is designated as 1/1 if the AF value surpasses 0.8.</p>
</list-item>
</list>
</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>The overall workflow of SVhawkeye. <bold>(A)</bold> Data processing of SVhawkeye. <bold>(B)</bold> The SVhawkeye tool provides five modules, the first four modules can be used independently to graphically display gene variation information, and the last module can be used for SV genotyping. The input file displays that all modules require BAM file(s) and coordinate information for use.</p>
</caption>
<graphic xlink:href="fgene-15-1352443-g001.tif"/>
</fig>
<sec id="s2-1">
<title>Workflow of SVhawkeye</title>
<p>The main &#x2018;hawkeye.py&#x2019; function comprises five subroutines: &#x2018;sv_browse,&#x2019; &#x2018;snpindel_browse,&#x2019; &#x2018;rna_browse,&#x2019; &#x2018;regiondepth_browse,&#x2019; and &#x2018;sv_genotyping.&#x2019; All of these subroutines require input in the form of BAM files and interval information, such as BED/VCF files or interval strings (<xref ref-type="fig" rid="F1">Figure 1B</xref>).</p>
</sec>
<sec id="s2-2">
<title>Moduel &#x23;1 sv_browse</title>
<p>The &#x2018;hawkeye.py sv_browse&#x2019; command is used to visualize structural variants within a specified interval, sourced from either a BED or VCF file. Firstly, the graphical layout and details closely resemble those of the IGV software. &#x2018;sv_browse&#x2019; offers the advantage of automatically identifying SV types from cigar-mapping and split-mapping reads. Furthermore, this software provides support for multiple sample files and facilitates the batch plotting of multiple intervals. Additionally, it demonstrates proficiency in presenting extensive intervals in a user-friendly fashion. It intelligently selects reads for display when confronted with an excessive quantity of fragments. This approach enables users to quickly assess the reliability of the target variant for subsequent analysis.</p>
<p>The using method of sv_browse command is as follows:</p>
<p>
<monospace>hawkeye.py sv_browse -i $bam -b $input.vcf -f vcf --thread $cpu -o $outdir --genome hg19 --quanlty 20 --sv_min_length 50 -F png</monospace>
</p>
<p>or</p>
<p>
<monospace>hawkeye.py sv_browse -i $bam -b $input.bed -f bed --thread $cpu -o $outdir --genome hg38 --quanlty 20 --sv_min_length 50 -F pdf</monospace>
</p>
</sec>
<sec id="s2-3">
<title>Moduel &#x23;2 snpindel_browse</title>
<p>The &#x2018;hawkeye.py snpindel_browse&#x2019; command is utilized to visualize SNVs or indel structures from sequencing data. Its usage closely mirrors that of &#x201c;sv_browse,&#x201d; and users have the option to specify a reference FASTA file using &#x201c;-r $ref.fa&#x201d; to display reference bases. This feature is very user-friendly for intervals less than 200bp.</p>
</sec>
<sec id="s2-4">
<title>Moduel &#x23;3 regiondepth_browse</title>
<p>The &#x201c;hawkeye.py regiondepth_browse&#x201d; command is utilized to quickly visualize the depth of a region within a specific segment of the genome, especially in areas where deletions or duplications are present.</p>
<p>The using method of regiondepth_browse command is as follows:</p>
<p>
<monospace>hawkeye.py regiondepth_browse -i $bam -o $outdir -r ${chrom:start-end}</monospace>
</p>
</sec>
<sec id="s2-5">
<title>Moduel &#x23;4 rna_browse</title>
<p>The &#x201c;hawkeye.py rna_browse&#x201d; command is used to visualize isoform structures obtained from RNA-seq or iso-seq data. Users need to provide a BED file containing the target interval and a GenePred (<xref ref-type="bibr" rid="B17">Hubisz and Siepel, 2023</xref>) file if the input species is not human.</p>
<p>The using method of rna_browse command is as follows:</p>
<p>
<monospace>hawkeye.py rna_browse -i $bam -b $inputbed -g $genome -t $cpu -o $outdir --genepred genome.genePred.gz</monospace>
</p>
</sec>
<sec id="s2-6">
<title>Moduel &#x23;5 sv_genotyping</title>
<p>The &#x201c;hawkeye.py sv_genotyping&#x201d; command is employed to swiftly perform genotyping of structural variants using an accurate force-calling method.</p>
<p>The using method of sv_genotyping command is as follows:</p>
<p>
<monospace>hawkeye.py sv_genotyping -i $bam -b $vcf -f vcf -o $outdir -t $cpu</monospace>
</p>
</sec>
</sec>
<sec id="s3" sec-type="results">
<title>Results</title>
<p>
<xref ref-type="table" rid="T1">Table 1</xref> presents a comprehensive comparison between SVhawkeye and commonly used SV plotting tools currently available. SVhawkeye boasts the following advantages.<list list-type="simple">
<list-item>
<p>1. Easy to Get Started: SVhawkeye is not required to install on personal computer, and includes an efficient matching annotation database. Users can operate it with a friendly one-click command-line operations, and only requires input the bam(s) and coordinate file (vcf/bed) (refer to <xref ref-type="table" rid="T1">Table 1</xref> Input format column).</p>
</list-item>
<list-item>
<p>2. Diversification: SVhawkeye supports multi-threading capabilities, and has the ability to display and compare multiple samples simultaneously.</p>
</list-item>
<list-item>
<p>3. Support for Displaying Very Large Intervals: SVhawkeye excels in presenting data across extensive intervals. It organizes reads for an orderly arrangement and provides depth information simultaneously (<xref ref-type="fig" rid="F2">Figure 2A</xref>). When handling an abundance of fragments, SVhawkeye intelligently selects a subset of reads for display, ensuring efficient visualization.</p>
</list-item>
<list-item>
<p>4. Automatic Variation Type Identification: In contrast to tools like Samplot and Svviz that require specifying SV types. SVhawkeye automatically identifies SV types based on coordinate information. It can highlight split-mapping reads and determined all SV types of reads within the interval, and marking their lengths numerically. (refer to <xref ref-type="table" rid="T1">Table 1</xref> variation type judgment column).</p>
</list-item>
<list-item>
<p>5. Support for Displaying All Variation Types: SVhawkeye stands out by providing essential functionality for displaying all variation types, including deletion (<xref ref-type="fig" rid="F2">Figure 2</xref>), insertion (<xref ref-type="fig" rid="F3">Figure 3</xref>), duplication (<xref ref-type="fig" rid="F4">Figure 4</xref>), inversion (<xref ref-type="fig" rid="F5">Figure 5</xref>), balanced translocations (<xref ref-type="fig" rid="F6">Figure 6</xref>) etc. This feature distinguishes it from other tools lacking this capability. (refer to <xref ref-type="table" rid="T1">Table 1</xref> variation type column).</p>
</list-item>
<list-item>
<p>6. Speediness: The speed of SVhawkeye is at the forefront of ensuring more information and accuracy. The average drawing time per SV on Ubantu 18.04 LTS is approximately 3.29&#xa0;s, only about 1&#xa0;s slower than the Samplot tool (refer to <xref ref-type="table" rid="T1">Table 1</xref> Speed column). On this basis, we also tested the performance of SVhawkeye on other aspects, the memory it occupies is related to the length and depth of the interval, usually not exceeding 1&#xa0;g (RAM), which can be satisfied by a personal computer (refer to <xref ref-type="table" rid="T2">Table 2</xref>).</p>
</list-item>
<list-item>
<p>7. SV Genotyping: Due to SVhawkeye&#x2019;s ability to determine the SV type for each read, SV genotyping is one of its strengths. However, SVhawkeye is better suited for long read sequencing. (refer to <xref ref-type="table" rid="T1">Table 1</xref> SV genotyping and Supports long reads columns).</p>
</list-item>
</list>
</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>Display of deletion. <bold>(A)</bold> SVhawkeye. When reads are split-mapping, the colored dotted lines represent gaps, reads are aligned to both ends, and the purple number in the middle indicates the deletion length. When cigar-mapping, reads are linked by solid line. <bold>(B)</bold> Bamsnap.</p>
</caption>
<graphic xlink:href="fgene-15-1352443-g002.tif"/>
</fig>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>Display of insertion. <bold>(A)</bold> IGV. <bold>(B)</bold> SVhawkeye. When reads are split-mapping, they would be colored, and cigar-mapping would not be. The purple number in the middle indicates the insertion length. The red breakpoint at the end indicates soft-clipping which indicates that the reads may be too short to display an incomplete insert frequently. <bold>(C)</bold> Samplot.</p>
</caption>
<graphic xlink:href="fgene-15-1352443-g003.tif"/>
</fig>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>Display of duplication. <bold>(A)</bold> IGV. <bold>(B)</bold> SVhawkeye. Split-mapping reads are colored, and the black number in the middle of the breakpoint indicates the length of duplication.</p>
</caption>
<graphic xlink:href="fgene-15-1352443-g004.tif"/>
</fig>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>Display of inversion. It is caused by two breaks in the same chromosome, and the resulting pieces are reversed 180&#xb0; and reconnected. <bold>(A)</bold> SVhawkeye. <bold>(B)</bold> Svviz</p>
</caption>
<graphic xlink:href="fgene-15-1352443-g005.tif"/>
</fig>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption>
<p>Display of balanced translocation. Two chromosomes from different sources are broken and then reconnected with each other to form two rearranged chromosomes in structure. The example data of balanced translocation are from NCBI (PRJNA559962) (<xref ref-type="bibr" rid="B16">Hu et al., 2020</xref>) and select the sample of SRR9982132. <bold>(A)</bold> Ribbon. <bold>(B)</bold> SVhawkeye.</p>
</caption>
<graphic xlink:href="fgene-15-1352443-g006.tif"/>
</fig>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>Drawing efficiency of 1000 randomly selected SVs.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">SVTYPE</th>
<th align="center">SV counts</th>
<th align="center">Max Len (/bp)</th>
<th align="center">Threads</th>
<th align="center">Max Memory (/M)</th>
<th align="center">Run time (s)</th>
<th align="center">Average time (/SV/thread)<xref ref-type="table-fn" rid="Tfn7">
<sup>a (s)</sup>
</xref>
</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">DEL</td>
<td align="center">437</td>
<td align="center">61,031</td>
<td align="center">4</td>
<td align="center">15.2</td>
<td align="center">26m19.34</td>
<td align="center">3.61</td>
</tr>
<tr>
<td align="center">INS</td>
<td align="center">516</td>
<td align="center">5,279</td>
<td align="center">4</td>
<td align="center">9.8</td>
<td align="center">25m20.07</td>
<td align="center">2.95</td>
</tr>
<tr>
<td align="center">INV</td>
<td align="center">47</td>
<td align="center">11,660</td>
<td align="center">4</td>
<td align="center">11.4</td>
<td align="center">3m12.27</td>
<td align="center">4.09</td>
</tr>
<tr>
<td align="center">ALL</td>
<td align="center">1,000</td>
<td align="center">61,031</td>
<td align="center">4</td>
<td align="center">15.2</td>
<td align="center">54m51.68</td>
<td align="center">3.29</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn id="Tfn7">
<label>
<sup>a</sup>
</label>
<p>Use Ubuntu 18.04 LTS, in DELL, Latitude 3510.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>In our visualization results example, all the data is obtained from Genome in a Bottle (GIAB) (<xref ref-type="bibr" rid="B30">Nature, 2015</xref>). <xref ref-type="fig" rid="F2">Figure 2</xref> shows a deletion variation with a length of more than 85&#xa0;K bp. SVhawkeye can quickly identify the mutation type, mutation length and the number of reads <xref ref-type="sec" rid="s10">Supplementary Material</xref> (<xref ref-type="fig" rid="F2">Figure 2A</xref>). Although Bamsnap is also a fast IGV-drawing based screenshot, it may require more information to support the displayed structural types. As it is only applicable to short reads and paired-end reads, it can quickly browse depth distribution information for NGS data (<xref ref-type="fig" rid="F2">Figure 2B</xref>). <xref ref-type="fig" rid="F3">Figure 3</xref> is a comparison chart of insertion variation with a length of about 1.6&#xa0;K. IGV (<xref ref-type="fig" rid="F3">Figure 3A</xref>) can display the cigar-mapped insertion in a friendly way, with the insertion length matching the length in SVhawkeye. However, it is not easy to visualise insertions caused by split-mapping reads present in soft-clipping (represented by red triangles at one or both ends of the reads). Insertion in IGV lacks support for two reads coloured by SVhawkeye (<xref ref-type="fig" rid="F3">Figure 3B</xref>). The depth information is ignored in samplot (<xref ref-type="fig" rid="F3">Figure 3C</xref>) and there is a situation of fuzzy SV length (2&#xa0;K). <xref ref-type="fig" rid="F4">Figure 4</xref> shows a DUP mutation with a length of more than 10&#xa0;Kbp. As described in <xref ref-type="fig" rid="F3">Figure 3A</xref>, if the mutation region is too long, the split-mapping reads make it difficult for IGV to display the SV type (<xref ref-type="fig" rid="F4">Figure 4A</xref>) and may need to be interpreted by manually concatenating the included soft-clipping reads. SVhawkeye does not require these complex manual operations (<xref ref-type="fig" rid="F4">Figure 4B</xref>). In the INV mutation example, SVhawkeye clearly shows the change in read alignment strand caused by the inversion (<xref ref-type="fig" rid="F5">Figure 5A</xref>). The Svviz plot is difficult to understand for a while, but its presentation style is worth learning (<xref ref-type="fig" rid="F5">Figure 5B</xref>). Finally, in the TRA example, SVhawkeye achieved a unique display compared to the aforementioned software, supporting reads at both ends of the breakpoint of the two chromosomes undergoing balanced translocation (<xref ref-type="fig" rid="F6">Figure 6B</xref>). Of course, the Ribbon software (<xref ref-type="bibr" rid="B29">Nattestad et al., 2021</xref>) also supports this type of display (<xref ref-type="fig" rid="F6">Figure 6A</xref>), but it cannot use command line operations and batch operations, so no detailed comparison was made.</p>
<p>In conclusion, SVhawkeye has a speed no lower than other software, and many easily understood factors have been added to the graph results, including SV type, SV length and SV read support. It can display the SV type with highlighted reads and record the SV length numerically. Samplot is fast and the graphs are clear and concise, but it may miss some important factors of SV, such as SV allele frequency, and may even give unreliable SV length. After all, for clinical samples, many detailed features need to be considered. The only drawback of IGV, as a commonly used software in the field of bioinformatics, is that it requires cumbersome steps to import bam file and adjust the reads to achieve the purpose of displaying specific mutation information. If the interval is large, it is difficult to display in IGV. Fortunately, Bamsnap and Svviz are more suitable for next-generation sequencing and are good at quickly displaying alignment information for short reads intervals. (refer to <xref ref-type="table" rid="T1">Table1</xref> Visual information reading column).</p>
<p>At the bottom of the structural diagram, gene annotations content has been added, including gene name, repeatmaker and genomicSuperDups database information (<xref ref-type="bibr" rid="B46">Wang et al., 2010</xref>), provide valuable insights into the annotation of the breakpoint location.</p>
<p>In addition, SVhawkeye distinguishes itself by incorporating features such as SNP, InDel, RNA splicing, and CNV visualization, which are not present in other tools. In the SNP and InDel diagram (<xref ref-type="sec" rid="s10">Supplementary Figure S1</xref>), users can conveniently access information for each base within the reads and include details about the reference sequence beneath the reads. The RNA splicing diagram (<xref ref-type="sec" rid="s10">Supplementary Figure S2</xref>) enables users to specify a gene interval for visualizing its isoform structure, detected from iso-seq or full-length single-cell transcriptome data. The CNV plot (<xref ref-type="sec" rid="s10">Supplementary Figure S3</xref>) requires users to input an interval to display the depth distribution of reads, facilitating the identification of the coverage range of the target area.</p>
<p>The genotyping feature is an essential component of SVhawkeye, contributing significantly to the accuracy of SV genotyping (<xref ref-type="fig" rid="F7">Figure 7</xref>). We utilized HG002 HiFi data for initial SV detection, employing tools such as sniffles and cute SV. Subsequently, we employed truvari (<xref ref-type="bibr" rid="B12">English et al., 2022</xref>) to compare SVhawkeye&#x2019;s recall SV results with the initial SVs using the GIAB Tier1 v0.6 benchmark data (<xref ref-type="bibr" rid="B50">Zook et al., 2020</xref>). This analysis revealed a substantial improvement in genotype prediction accuracy, increasing from 31.6123% to 46.8814% for the sniffles results and from 90.8312% to 91.0554% for the cute SV results. Furthermore, the recall rate improved from 73.4472% to 85.6892% for the sniffles results and from 94.5167% to 94.75% for the cute SV results.</p>
<fig id="F7" position="float">
<label>FIGURE 7</label>
<caption>
<p>Comparison of accuracy of SV genotyping. <bold>(A)</bold> Genotyping from SVhawkeye compare to sniffles. <bold>(B)</bold> Genotyping from SVhawkeye compare to CuteSV.</p>
</caption>
<graphic xlink:href="fgene-15-1352443-g007.tif"/>
</fig>
</sec>
<sec id="s4">
<title>Discussion and applications</title>
<p>In summary, the SVhawkeye software takes inspiration from the layout of IGV and aims to provide a swift, comprehensive visualization of structural variants. It automates the interpretation of read data and presents it in a meaningful and visually intuitive manner. This improved clarity and user-friendliness greatly streamline both the sequencing process and data interpretation, saving valuable time for biomedical researchers.</p>
<p>With SVhawkeye&#x2019;s assistance, users can rapidly identify target regions across multiple disease samples, trio or pedigree samples, and more. For instance, SVhawkeye accurately detects balanced translocations, as demonstrated in various studies, including those referenced in PMC8804325 (<xref ref-type="bibr" rid="B31">Pei et al., 2022</xref>), benchmark structural variant research (<xref ref-type="bibr" rid="B10">Du et al., 2022</xref>), and population short tandem repeat counts, as verified in PMC9117641 (<xref ref-type="bibr" rid="B24">Liu et al., 2022</xref>). SVhawkeye is well-suited for detecting structural variants in clinical samples generated from PacBio or Oxford Nanopore sequencing. Of course, it is also suitable for other species and requires screening for more accurate variations, such as population variation analysis.</p>
<p>It is worth noting that while SVhawkeye offers valuable features, certain challenges in the sv_genotyping aspect, such as false-positive issues, remain unaddressed. These challenges include concerns such as read correction, breakpoint fragment realignment, and local assembly checking. Therefore, there is significant potential for future enhancements in the sv_genotyping component of SVhawkeye.</p>
</sec>
</body>
<back>
<sec id="s5" sec-type="data-availability">
<title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article/<xref ref-type="sec" rid="s10">Supplementary Material</xref>, further inquiries can be directed to the corresponding authors.</p>
</sec>
<sec id="s6">
<title>Author contributions</title>
<p>YX: Writing&#x2013;review and editing, Resources, Software, Visualization, Writing&#x2013;original draft. TY: Writing&#x2013;original draft, Investigation. FL: Conceptualization, Methodology, Writing&#x2013;review and editing. TH: Funding acquisition, Project administration, Supervision, Writing&#x2013;review and editing.</p>
</sec>
<sec id="s7" sec-type="funding-information">
<title>Funding</title>
<p>This work is supported by the Natural Science Foundation of Hubei Province (No. 2022CFB474), Research Project of Jianghan University (No. 2021yb026), the National Natural Science Foundation of China (No. 12174296), Hubei Province "JD" Technology Research Project (No. 2023BAA019-5), the Key Research and Development Program of Hubei Province (No. 2021BAA057) and the 111 Project (No. D18018).</p>
</sec>
<sec id="s8" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>FL was employed by the company GrandOmics Biosciences.</p>
<p>The remaining authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s9" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s10">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fgene.2024.1352443/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fgene.2024.1352443/full&#x23;supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="Image3.JPEG" id="SM1" mimetype="application/JPEG" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image1.JPEG" id="SM2" mimetype="application/JPEG" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image4.JPEG" id="SM3" mimetype="application/JPEG" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image2.JPEG" id="SM4" mimetype="application/JPEG" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="DataSheet1.PDF" id="SM5" mimetype="application/PDF" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Abel</surname>
<given-names>H. J.</given-names>
</name>
<name>
<surname>Larson</surname>
<given-names>D. E.</given-names>
</name>
<name>
<surname>Regier</surname>
<given-names>A. A.</given-names>
</name>
<name>
<surname>Chiang</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Das</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Kanchi</surname>
<given-names>K. L.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Mapping and characterization of structural variation in 17,795 human genomes</article-title>. <source>Nature</source> <volume>583</volume> (<issue>7814</issue>), <fpage>83</fpage>&#x2013;<lpage>89</lpage>. <pub-id pub-id-type="doi">10.1038/s41586-020-2371-0</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Abeysinghe</surname>
<given-names>S. S.</given-names>
</name>
<name>
<surname>Chuzhanova</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Cooper</surname>
<given-names>D. N.</given-names>
</name>
</person-group> (<year>2006</year>). <article-title>Gross deletions and translocations in human genetic disease</article-title>. <source>Genome Dyn.</source> <volume>1</volume>, <fpage>17</fpage>&#x2013;<lpage>34</lpage>. <pub-id pub-id-type="doi">10.1159/000092498</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bakhtiari</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Park</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Ding</surname>
<given-names>Y. C.</given-names>
</name>
<name>
<surname>Shleizer-Burko</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Neuhausen</surname>
<given-names>S. L.</given-names>
</name>
<name>
<surname>Halld&#xf3;rsson</surname>
<given-names>B. V.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Variable number tandem repeats mediate the expression of proximal genes</article-title>. <source>Nat. Commun.</source> <volume>12</volume> (<issue>1</issue>), <fpage>2075</fpage>. <pub-id pub-id-type="doi">10.1038/s41467-021-22206-z</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Belyeu</surname>
<given-names>J. R.</given-names>
</name>
<name>
<surname>Chowdhury</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Brown</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Pedersen</surname>
<given-names>B. S.</given-names>
</name>
<name>
<surname>Cormier</surname>
<given-names>M. J.</given-names>
</name>
<name>
<surname>Quinlan</surname>
<given-names>A. R.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Samplot: a platform for structural variant visual validation and automated filtering</article-title>. <source>Genome Biol.</source> <volume>22</volume> (<issue>1</issue>), <fpage>161</fpage>. <pub-id pub-id-type="doi">10.1186/s13059-021-02380-5</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chain</surname>
<given-names>F. J.</given-names>
</name>
<name>
<surname>Feulner</surname>
<given-names>P. G.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Ecological and evolutionary implications of genomic structural variations</article-title>. <source>Front. Genet.</source> <volume>5</volume>, <fpage>326</fpage>. <pub-id pub-id-type="doi">10.3389/fgene.2014.00326</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chiang</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Scott</surname>
<given-names>A. J.</given-names>
</name>
<name>
<surname>Davis</surname>
<given-names>J. R.</given-names>
</name>
<name>
<surname>Tsang</surname>
<given-names>E. K.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>The impact of structural variation on human gene expression</article-title>. <source>Nat. Genet.</source> <volume>49</volume> (<issue>5</issue>), <fpage>692</fpage>&#x2013;<lpage>699</lpage>. <pub-id pub-id-type="doi">10.1038/ng.3834</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dai</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Feng</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhu</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Kong</surname>
<given-names>X.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Analysis of gene inversion in Hemophilia A by Nanopore sequencing</article-title>. <source>Chin. J. Med. Genet.</source> <volume>38</volume> (<issue>6</issue>), <fpage>521</fpage>&#x2013;<lpage>525</lpage>. <pub-id pub-id-type="doi">10.3760/cma.j.cn511374-20200630-00481</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dennis</surname>
<given-names>M. Y.</given-names>
</name>
<name>
<surname>Harshman</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Nelson</surname>
<given-names>B. J.</given-names>
</name>
<name>
<surname>Penn</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Cantsilieris</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Huddleston</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>The evolution and population diversity of human-specific segmental duplications</article-title>. <source>Nat. Ecol. Evol.</source> <volume>1</volume> (<issue>3</issue>), <fpage>69</fpage>. <pub-id pub-id-type="doi">10.1038/s41559-016-0069</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Du</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Liang</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Robust benchmark structural variant calls of an asian using state-of-the-art long-read sequencing technologies</article-title>. <source>Genomics, proteomics, Bioinforma.</source> <volume>20</volume> (<issue>1</issue>), <fpage>192</fpage>&#x2013;<lpage>204</lpage>. <pub-id pub-id-type="doi">10.1016/j.gpb.2020.10.006</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Duan</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Pan</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Fan</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Comprehensive evaluation of structural variant genotyping methods based on long-read sequencing data</article-title>. <source>BMC Genomics</source> <volume>23</volume>, <fpage>324</fpage>. <pub-id pub-id-type="doi">10.1186/s12864-022-08548-y</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>English</surname>
<given-names>A. C.</given-names>
</name>
<name>
<surname>Menon</surname>
<given-names>V. K.</given-names>
</name>
<name>
<surname>Gibbs</surname>
<given-names>R. A.</given-names>
</name>
<name>
<surname>Metcalf</surname>
<given-names>G. A.</given-names>
</name>
<name>
<surname>Sedlazeck</surname>
<given-names>F. J.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Truvari: refined structural variant comparison preserves allelic diversity</article-title>. <source>Genome Biol.</source> <volume>23</volume>, <fpage>271</fpage>. <pub-id pub-id-type="doi">10.1186/s13059-022-02840-6</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fanciulli</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Petretto</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Aitman</surname>
<given-names>T. J.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Gene copy number variation and common human disease</article-title>. <source>Clin. Genet.</source> <volume>77</volume> (<issue>3</issue>), <fpage>201</fpage>&#x2013;<lpage>213</lpage>. <pub-id pub-id-type="doi">10.1111/j.1399-0004.2009.01342.x</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Heller</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Vingron</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>SVIM: structural variant identification using mapped long reads</article-title>. <source>Bioinformatics</source> <volume>35</volume>, <fpage>2907</fpage>&#x2013;<lpage>2915</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btz041</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hoischen</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Krumm</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Eichler</surname>
<given-names>E. E.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Prioritization of neurodevelopmental disease genes by discovery of new mutations</article-title>. <source>Nat. Neurosci.</source> <volume>17</volume> (<issue>6</issue>), <fpage>764</fpage>&#x2013;<lpage>772</lpage>. <pub-id pub-id-type="doi">10.1038/nn.3703</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hu</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Liang</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Cheng</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Yu</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Zha</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Location of balanced chromosome-translocation breakpoints by long-read sequencing on the Oxford Nanopore platform</article-title>. <source>Front. Genet.</source> <volume>10</volume>, <fpage>1313</fpage>. <pub-id pub-id-type="doi">10.3389/fgene.2019.01313</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="web">
<person-group person-group-type="author">
<name>
<surname>Hubisz</surname>
<given-names>M. J.</given-names>
</name>
<name>
<surname>Siepel</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Read a feature file (GFF, BED, or GenePred)</article-title>. <comment>Available at: <ext-link ext-link-type="uri" xlink:href="https://rdrr.io/cran/rphast/man/read.feat.html">https://rdrr.io/cran/rphast/man/read.feat.html</ext-link>.</comment>
</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jarvis</surname>
<given-names>J. P.</given-names>
</name>
<name>
<surname>Scheinfeldt</surname>
<given-names>L. B.</given-names>
</name>
<name>
<surname>Soi</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Lambert</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Omberg</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Ferwerda</surname>
<given-names>B.</given-names>
</name>
<etal/>
</person-group> (<year>2012</year>). <article-title>Patterns of ancestry, signatures of natural selection, and genetic association with stature in Western African pygmies</article-title>. <source>PLoS Genet.</source> <volume>8</volume> (<issue>4</issue>), <fpage>e1002641</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pgen.1002641</pub-id>
</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jiang</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Jiang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Gao</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Cui</surname>
<given-names>Z.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Long-read-based human genomic structural variation detection with cuteSV</article-title>. <source>Genome Biol.</source> <volume>21</volume> (<issue>1</issue>), <fpage>189</fpage>. <pub-id pub-id-type="doi">10.1186/s13059-020-02107-y</pub-id>
</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kamberov</surname>
<given-names>Y. G.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Tan</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Gerbault</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Wark</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Tan</surname>
<given-names>L.</given-names>
</name>
<etal/>
</person-group> (<year>2013</year>). <article-title>Modeling recent human evolution in mice by expression of a selected EDAR variant</article-title>. <source>Cell</source> <volume>152</volume> (<issue>4</issue>), <fpage>691</fpage>&#x2013;<lpage>702</lpage>. <pub-id pub-id-type="doi">10.1016/j.cell.2013.01.016</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Katsonis</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Koire</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Wilson</surname>
<given-names>S. J.</given-names>
</name>
<name>
<surname>Hsu</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Lua</surname>
<given-names>R. C.</given-names>
</name>
<name>
<surname>Wilkins</surname>
<given-names>A. D.</given-names>
</name>
<etal/>
</person-group> (<year>2014</year>). <article-title>Single nucleotide variations: biological impact and theoretical interpretation</article-title>. <source>Protein Sci.</source> <volume>23</volume> (<issue>12</issue>), <fpage>1650</fpage>&#x2013;<lpage>1666</lpage>. <pub-id pub-id-type="doi">10.1002/pro.2552</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Klar</surname>
<given-names>A. J. S.</given-names>
</name>
</person-group> (<year>2004</year>). <article-title>A genetic mechanism implicates chromosome 11 in schizophrenia and bipolar diseases</article-title>. <source>Genetics</source> <volume>167</volume> (<issue>4</issue>), <fpage>1833</fpage>&#x2013;<lpage>1840</lpage>. <pub-id pub-id-type="doi">10.1534/genetics.104.028217</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kwon</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Berselli</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Chu</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Park</surname>
<given-names>P. J.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>BamSnap: a lightweight viewer for sequencing reads in BAM files</article-title>. <source>Bioinformatics</source> <volume>37</volume> (<issue>2</issue>), <fpage>263</fpage>&#x2013;<lpage>264</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btaa1101</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Xiao</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zeng</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Yuan</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>X.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Profiling the genome-wide landscape of short tandem repeats by long-read sequencing</article-title>. <source>Front. Genet.</source> <volume>13</volume>, <fpage>810595</fpage>. <pub-id pub-id-type="doi">10.3389/fgene.2022.810595</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>MacArthur</surname>
<given-names>D. G.</given-names>
</name>
<name>
<surname>Seto</surname>
<given-names>J. T.</given-names>
</name>
<name>
<surname>Raftery</surname>
<given-names>J. M.</given-names>
</name>
<name>
<surname>Quinlan</surname>
<given-names>K. G.</given-names>
</name>
<name>
<surname>Huttley</surname>
<given-names>G. A.</given-names>
</name>
<name>
<surname>Hook</surname>
<given-names>J. W.</given-names>
</name>
<etal/>
</person-group> (<year>2007</year>). <article-title>Loss of ACTN3 gene function alters mouse muscle metabolism and shows evidence of positive selection in humans</article-title>. <source>Nat. Genet.</source> <volume>39</volume> (<issue>10</issue>), <fpage>1261</fpage>&#x2013;<lpage>1265</lpage>. <pub-id pub-id-type="doi">10.1038/ng2122</pub-id>
</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Marshall</surname>
<given-names>C. R.</given-names>
</name>
<name>
<surname>Howrigan</surname>
<given-names>D. P.</given-names>
</name>
<name>
<surname>Merico</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Thiruvahindrapuram</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Greer</surname>
<given-names>D. S.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>Contribution of copy number variants to schizophrenia from a genome-wide study of 41,321 subjects</article-title>. <source>Nat. Genet.</source> <volume>49</volume> (<issue>1</issue>), <fpage>27</fpage>&#x2013;<lpage>35</lpage>. <pub-id pub-id-type="doi">10.1038/ng.3725</pub-id>
</citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Masters</surname>
<given-names>J. R.</given-names>
</name>
<name>
<surname>Thomson</surname>
<given-names>J. A.</given-names>
</name>
<name>
<surname>Daly-Burns</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Reid</surname>
<given-names>Y. A.</given-names>
</name>
<name>
<surname>Dirks</surname>
<given-names>W. G.</given-names>
</name>
<name>
<surname>Packer</surname>
<given-names>P.</given-names>
</name>
<etal/>
</person-group> (<year>2001</year>). <article-title>Short tandem repeat profiling provides an international reference standard for human cell lines</article-title>. <source>Proc. Natl. Acad. Sci. U. S. A.</source> <volume>98</volume> (<issue>14</issue>), <fpage>8012</fpage>&#x2013;<lpage>8017</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.121616198</pub-id>
</citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>McColgan</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Tabrizi</surname>
<given-names>S. J.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Huntington&#x2019;s disease: a clinical review</article-title>. <source>Eur. J. Neurology</source> <volume>25</volume> (<issue>1</issue>), <fpage>24</fpage>&#x2013;<lpage>34</lpage>. <pub-id pub-id-type="doi">10.1111/ene.13413</pub-id>
</citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nattestad</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Aboukhalil</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Chin</surname>
<given-names>C. S.</given-names>
</name>
<name>
<surname>Schatz</surname>
<given-names>M. C.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Ribbon: intuitive visualization for complex genomic variation</article-title>. <source>Bioinforma. Oxf. Engl.</source> <volume>37</volume> (<issue>3</issue>), <fpage>413</fpage>&#x2013;<lpage>415</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btaa680</pub-id>
</citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<collab>Nature</collab> (<year>2015</year>). <article-title>Genome in a bottle&#x2014;a human DNA standard</article-title>. <source>Nat. Biotechnol.</source> <volume>33</volume> (<issue>7</issue>), <fpage>675</fpage>. <pub-id pub-id-type="doi">10.1038/nbt0715-675a</pub-id>
</citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pei</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Deng</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Lei</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Du</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Yu</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>X.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Identifying balanced chromosomal translocations in human embryos by oxford nanopore sequencing and breakpoints region analysis</article-title>. <source>Front. Genet.</source> <volume>12</volume>, <fpage>810900</fpage>. <pub-id pub-id-type="doi">10.3389/fgene.2021.810900</pub-id>
</citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Perry</surname>
<given-names>G. H.</given-names>
</name>
<name>
<surname>Dominy</surname>
<given-names>N. J.</given-names>
</name>
<name>
<surname>Claw</surname>
<given-names>K. G.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>A. S.</given-names>
</name>
<name>
<surname>Fiegler</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Redon</surname>
<given-names>R.</given-names>
</name>
<etal/>
</person-group> (<year>2007</year>). <article-title>Diet and the evolution of human amylase gene copy number variation</article-title>. <source>Nat. Genet.</source> <volume>39</volume> (<issue>10</issue>), <fpage>1256</fpage>&#x2013;<lpage>1260</lpage>. <pub-id pub-id-type="doi">10.1038/ng2123</pub-id>
</citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Robinson</surname>
<given-names>J. T.</given-names>
</name>
<name>
<surname>Thorvaldsd&#xf3;ttir</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Turner</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Mesirov</surname>
<given-names>J. P.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>igv.jus: an embeddable JavaScript implementation of the Integrative Genomics Viewer (IGV)</article-title>. <source>Bioinformatics</source>. <pub-id pub-id-type="doi">10.1101/2020.05.03.075499</pub-id>
</citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Robinson</surname>
<given-names>J. T.</given-names>
</name>
<name>
<surname>Thorvaldsd&#xf3;ttir</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Wenger</surname>
<given-names>A. M.</given-names>
</name>
<name>
<surname>Zehir</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Mesirov</surname>
<given-names>J. P.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Variant review with the integrative genomics viewer</article-title>. <source>Cancer Res.</source> <volume>77</volume> (<issue>21</issue>), <fpage>e31</fpage>&#x2013;<lpage>e34</lpage>. <pub-id pub-id-type="doi">10.1158/0008-5472.can-17-0337</pub-id>
</citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Robinson</surname>
<given-names>J. T.</given-names>
</name>
<name>
<surname>Thorvaldsd&#xf3;ttir</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Winckler</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Guttman</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Lander</surname>
<given-names>E. S.</given-names>
</name>
<name>
<surname>Getz</surname>
<given-names>G.</given-names>
</name>
<etal/>
</person-group> (<year>2011</year>). <article-title>Integrative genomics viewer</article-title>. <source>Nat. Biotechnol.</source> <volume>29</volume> (<issue>1</issue>), <fpage>24</fpage>&#x2013;<lpage>26</lpage>. <pub-id pub-id-type="doi">10.1038/nbt.1754</pub-id>
</citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Roses</surname>
<given-names>A. D.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Polyallelic structural variants can provide accurate, highly informative genetic markers focused on diagnosis and therapeutic targets: accuracy vs. Precision</article-title>. <source>Clin. Pharmacol. Ther.</source> <volume>99</volume> (<issue>2</issue>), <fpage>169</fpage>&#x2013;<lpage>171</lpage>. <pub-id pub-id-type="doi">10.1002/cpt.288</pub-id>
</citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Santoro</surname>
<given-names>J. D.</given-names>
</name>
<name>
<surname>Pagarkar</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Chu</surname>
<given-names>D. T.</given-names>
</name>
<name>
<surname>Rosso</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Paulsen</surname>
<given-names>K. C.</given-names>
</name>
<name>
<surname>Levitt</surname>
<given-names>P.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Neurologic complications of Down syndrome: a systematic review</article-title>. <source>J. Neurology</source> <volume>268</volume>, <fpage>4495</fpage>&#x2013;<lpage>4509</lpage>. <pub-id pub-id-type="doi">10.1007/s00415-020-10179-w</pub-id>
</citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Santoro</surname>
<given-names>J. D.</given-names>
</name>
<name>
<surname>Partridge</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Tanna</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Pagarkar</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Khoshnood</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Rehmani</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Evidence of neuroinflammation and immunotherapy responsiveness in individuals with down syndrome regression disorder</article-title>. <source>J. Neurodev. Disord.</source> <volume>14</volume> (<issue>1</issue>), <fpage>35</fpage>. <pub-id pub-id-type="doi">10.1186/s11689-022-09446-w</pub-id>
</citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sch&#xfc;le</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>McFarland</surname>
<given-names>K. N.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Tsai</surname>
<given-names>Y. C.</given-names>
</name>
<name>
<surname>Nguyen</surname>
<given-names>K. D.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>C.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>Parkinson&#x2019;s disease associated with pure ATXN10 repeat expansion</article-title>. <source>npj Parkinson&#x27;s Dis.</source> <volume>3</volume> (<issue>1</issue>), <fpage>27</fpage>. <pub-id pub-id-type="doi">10.1038/s41531-017-0029-x</pub-id>
</citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sedlazeck</surname>
<given-names>F. J.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Darby</surname>
<given-names>C. A.</given-names>
</name>
<name>
<surname>Schatz</surname>
<given-names>M. C.</given-names>
</name>
</person-group> (<year>2018a</year>). <article-title>Piercing the dark matter: bioinformatics of long-range sequencing and mapping</article-title>. <source>Nat. Rev. Genet.</source> <volume>19</volume>, <fpage>329</fpage>&#x2013;<lpage>346</lpage>. <pub-id pub-id-type="doi">10.1038/s41576-018-0003-4</pub-id>
</citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sedlazeck</surname>
<given-names>F. J.</given-names>
</name>
<name>
<surname>Rescheneder</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Smolka</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Fang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Nattestad</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>von Haeseler</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2018b</year>). <article-title>Accurate detection of complex structural variations using single-molecule sequencing</article-title>. <source>Nat. Methods</source> <volume>15</volume>, <fpage>461</fpage>&#x2013;<lpage>468</lpage>. <pub-id pub-id-type="doi">10.1038/s41592-018-0001-7</pub-id>
</citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Spies</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Zook</surname>
<given-names>J. M.</given-names>
</name>
<name>
<surname>Salit</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Sidow</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>svviz: a read viewer for validating structural variants</article-title>. <source>Bioinformatics</source> <volume>31</volume> (<issue>24</issue>), <fpage>3994</fpage>&#x2013;<lpage>3996</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btv478</pub-id>
</citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sudmant</surname>
<given-names>P. H.</given-names>
</name>
<name>
<surname>Rausch</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Gardner</surname>
<given-names>E. J.</given-names>
</name>
<name>
<surname>Handsaker</surname>
<given-names>R. E.</given-names>
</name>
<name>
<surname>Abyzov</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Huddleston</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2015</year>). <article-title>An integrated map of structural variation in 2,504 human genomes</article-title>. <source>Nature</source> <volume>526</volume> (<issue>7571</issue>), <fpage>75</fpage>&#x2013;<lpage>81</lpage>. <pub-id pub-id-type="doi">10.1038/nature15394</pub-id>
</citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Thorvaldsdottir</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Robinson</surname>
<given-names>J. T.</given-names>
</name>
<name>
<surname>Mesirov</surname>
<given-names>J. P.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Integrative Genomics Viewer (IGV): high-performance genomics data visualization and exploration</article-title>. <source>Briefings Bioinforma.</source> <volume>14</volume> (<issue>2</issue>), <fpage>178</fpage>&#x2013;<lpage>192</lpage>. <pub-id pub-id-type="doi">10.1093/bib/bbs017</pub-id>
</citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Vogelstein</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Papadopoulos</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Velculescu</surname>
<given-names>V. E.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Diaz</surname>
<given-names>L. A.</given-names>
</name>
<name>
<surname>Kinzler</surname>
<given-names>K. W.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Cancer genome landscapes</article-title>. <source>Science</source> <volume>339</volume>, <fpage>1546</fpage>&#x2013;<lpage>1558</lpage>. <pub-id pub-id-type="doi">10.1126/science.1235122</pub-id>
</citation>
</ref>
<ref id="B46">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Hakonarson</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>ANNOVAR: functional annotation of genetic variants from high-throughput sequencing data</article-title>. <source>Nucleic Acids Res.</source> <volume>38</volume> (<issue>16</issue>), <fpage>164</fpage>. <pub-id pub-id-type="doi">10.1093/nar/gkq603</pub-id>
</citation>
</ref>
<ref id="B47">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wilkinson</surname>
<given-names>M. E.</given-names>
</name>
<name>
<surname>Charenton</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Nagai</surname>
<given-names>K.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>RNA splicing by the spliceosome</article-title>. <source>Annu. Rev. Biochem.</source> <volume>89</volume>, <fpage>359</fpage>&#x2013;<lpage>388</lpage>. <pub-id pub-id-type="doi">10.1146/annurev-biochem-091719-064225</pub-id>
</citation>
</ref>
<ref id="B48">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wong</surname>
<given-names>K. K.</given-names>
</name>
<name>
<surname>deLeeuw</surname>
<given-names>R. J.</given-names>
</name>
<name>
<surname>Dosanjh</surname>
<given-names>N. S.</given-names>
</name>
<name>
<surname>Kimm</surname>
<given-names>L. R.</given-names>
</name>
<name>
<surname>Cheng</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Horsman</surname>
<given-names>D. E.</given-names>
</name>
<etal/>
</person-group> (<year>2007</year>). <article-title>A comprehensive analysis of common copy-number variations in the human genome</article-title>. <source>Am. J. Hum. Genet.</source> <volume>80</volume> (<issue>1</issue>), <fpage>91</fpage>&#x2013;<lpage>104</lpage>. <pub-id pub-id-type="doi">10.1086/510560</pub-id>
</citation>
</ref>
<ref id="B49">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zack</surname>
<given-names>T. I.</given-names>
</name>
<name>
<surname>Schumacher</surname>
<given-names>S. E.</given-names>
</name>
<name>
<surname>Carter</surname>
<given-names>S. L.</given-names>
</name>
<name>
<surname>Cherniack</surname>
<given-names>A. D.</given-names>
</name>
<name>
<surname>Saksena</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Tabak</surname>
<given-names>B.</given-names>
</name>
<etal/>
</person-group> (<year>2013</year>). <article-title>Pan-cancer patterns of somatic copy number alteration</article-title>. <source>Nat. Genet.</source> <volume>45</volume> (<issue>10</issue>), <fpage>1134</fpage>&#x2013;<lpage>1140</lpage>. <pub-id pub-id-type="doi">10.1038/ng.2760</pub-id>
</citation>
</ref>
<ref id="B50">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zook</surname>
<given-names>J. M.</given-names>
</name>
<name>
<surname>Hansen</surname>
<given-names>N. F.</given-names>
</name>
<name>
<surname>Olson</surname>
<given-names>N. D.</given-names>
</name>
<name>
<surname>Chapman</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Mullikin</surname>
<given-names>J. C.</given-names>
</name>
<name>
<surname>Xiao</surname>
<given-names>C.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>A robust benchmark for detection of germline large deletions and insertions</article-title>. <source>Nat. Biotechnol.</source> <volume>38</volume> (<issue>11</issue>), <fpage>1347</fpage>&#x2013;<lpage>1355</lpage>. <pub-id pub-id-type="doi">10.1038/s41587-020-0538-8</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>