<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Archiving and Interchange DTD v2.3 20070202//EN" "archivearticle.dtd">
<article article-type="methods-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Genet.</journal-id>
<journal-title>Frontiers in Genetics</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Genet.</abbrev-journal-title>
<issn pub-type="epub">1664-8021</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">1089936</article-id>
<article-id pub-id-type="doi">10.3389/fgene.2023.1089936</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Genetics</subject>
<subj-group>
<subject>Methods</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Destin2: Integrative and cross-modality analysis of single-cell chromatin accessibility data</article-title>
<alt-title alt-title-type="left-running-head">Guan et al.</alt-title>
<alt-title alt-title-type="right-running-head">
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3389/fgene.2023.1089936">10.3389/fgene.2023.1089936</ext-link>
</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Guan</surname>
<given-names>Peter Y.</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Lee</surname>
<given-names>Jin Seok</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Wang</surname>
<given-names>Lihao</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Lin</surname>
<given-names>Kevin Z.</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Mei</surname>
<given-names>Wenwen</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Chen</surname>
<given-names>Li</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Jiang</surname>
<given-names>Yuchao</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff5">
<sup>5</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1072874/overview"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Department of Biostatistics</institution>, <institution>University of North Carolina at Chapel Hill</institution>, <addr-line>Chapel Hill</addr-line>, <addr-line>NC</addr-line>, <country>Unites States</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Department of Genetics</institution>, <institution>University of North Carolina at Chapel Hill</institution>, <addr-line>Chapel Hill</addr-line>, <addr-line>NC</addr-line>, <country>Unites States</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Department of Statistics</institution>, <institution>University of Pennsylvania</institution>, <addr-line>Philadelphia</addr-line>, <addr-line>PA</addr-line>, <country>Unites States</country>
</aff>
<aff id="aff4">
<sup>4</sup>
<institution>Department of Biostatistics</institution>, <institution>University of Florida</institution>, <addr-line>Gainesville</addr-line>, <addr-line>FL</addr-line>, <country>Unites States</country>
</aff>
<aff id="aff5">
<sup>5</sup>
<institution>Lineberger Comprehensive Cancer Center</institution>, <institution>University of North Carolina at Chapel Hill</institution>, <addr-line>Chapel Hill</addr-line>, <addr-line>NC</addr-line>, <country>Unites States</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1641101/overview">Zhicheng Ji</ext-link>, Duke University, United States</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1092204/overview">Zhixiang Lin</ext-link>, The Chinese University of Hong Kong, China</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/668193/overview">Rhonda Bacher</ext-link>, University of Florida, United States</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Yuchao Jiang, <email>yuchaoj@email.unc.edu</email>
</corresp>
<fn fn-type="other">
<p>This article was submitted to Statistical Genetics and Methodology, a section of the journal Frontiers in Genetics</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>17</day>
<month>02</month>
<year>2023</year>
</pub-date>
<pub-date pub-type="collection">
<year>2023</year>
</pub-date>
<volume>14</volume>
<elocation-id>1089936</elocation-id>
<history>
<date date-type="received">
<day>04</day>
<month>11</month>
<year>2022</year>
</date>
<date date-type="accepted">
<day>06</day>
<month>02</month>
<year>2023</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2023 Guan, Lee, Wang, Lin, Mei, Chen and Jiang.</copyright-statement>
<copyright-year>2023</copyright-year>
<copyright-holder>Guan, Lee, Wang, Lin, Mei, Chen and Jiang</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>We propose Destin2, a novel statistical and computational method for cross-modality dimension reduction, clustering, and trajectory reconstruction for single-cell ATAC-seq data. The framework integrates cellular-level epigenomic profiles from peak accessibility, motif deviation score, and pseudo-gene activity and learns a shared manifold using the multimodal input, followed by clustering and/or trajectory inference. We apply Destin2 to real scATAC-seq datasets with both discretized cell types and transient cell states and carry out benchmarking studies against existing methods based on unimodal analyses. Using cell-type labels transferred with high confidence from unmatched single-cell RNA sequencing data, we adopt four performance assessment metrics and demonstrate how Destin2 corroborates and improves upon existing methods. Using single-cell RNA and ATAC multiomic data, we further exemplify how Destin2&#x2019;s cross-modality integrative analyses preserve true cell-cell similarities using the matched cell pairs as ground truths. Destin2 is compiled as a freely available R package available at <ext-link ext-link-type="uri" xlink:href="https://github.com/yuchaojiang/Destin2">https://github.com/yuchaojiang/Destin2</ext-link>.</p>
</abstract>
<kwd-group>
<kwd>single-cell epigenomics</kwd>
<kwd>single-cell ATAC-seq</kwd>
<kwd>chromatin accessibility</kwd>
<kwd>single-cell multiome</kwd>
<kwd>cross-modality integration</kwd>
</kwd-group>
<contract-num rid="cn001">R35 GM138342</contract-num>
<contract-sponsor id="cn001">National Institute of General Medical Sciences<named-content content-type="fundref-id">10.13039/100000057</named-content>
</contract-sponsor>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="s1">
<title>Introduction</title>
<p>Recent advances in single-cell assay of transposase-accessible chromatin followed by sequencing (scATAC-seq) technologies (<xref ref-type="bibr" rid="B4">Buenrostro et al., 2015</xref>; <xref ref-type="bibr" rid="B8">Cusanovich et al., 2015</xref>; <xref ref-type="bibr" rid="B34">Satpathy et al., 2019</xref>) offer unprecedented opportunities to characterize cellular-level chromatin accessibilities and have been successfully applied to atlas-scale datasets to yield novel insights on epigenomic heterogeneity (<xref ref-type="bibr" rid="B9">Cusanovich et al., 2018</xref>; <xref ref-type="bibr" rid="B11">Domcke et al., 2020</xref>). scATAC-seq data analysis presents unique methodological challenges due to its high noise, sparsity, and dimensionality (<xref ref-type="bibr" rid="B42">Urrutia et al., 2019</xref>). Multiple statistical and computational methods have been developed and evaluated by independent benchmark studies (<xref ref-type="bibr" rid="B6">Chen et al., 2019</xref>).</p>
<p>The first set of methods call ATAC peaks or segment the genome into bins and take the cell by peak (or cell by bin) matrix as input. Among these methods, Signac (<xref ref-type="bibr" rid="B40">Stuart et al., 2021</xref>), scOpen (<xref ref-type="bibr" rid="B23">Li et al., 2021</xref>), and RA3 (<xref ref-type="bibr" rid="B7">Chen et al., 2021</xref>) perform TF-IDF normalization followed by different dimension reduction techniques. SnapATAC (<xref ref-type="bibr" rid="B12">Fang et al., 2021</xref>) computes a Jaccard similarity matrix, while cisTopic (<xref ref-type="bibr" rid="B2">Bravo Gonzalez-Blas et al., 2019</xref>) performs topic modeling. Moving beyond the peak matrix, Cicero (<xref ref-type="bibr" rid="B29">Pliner et al., 2018</xref>) and MAESTRO (<xref ref-type="bibr" rid="B43">Wang et al., 2020</xref>) make gene expression predictions from unweighted and weighted sum of the ATAC reads in gene bodies and promoter regions, respectively; the predicted gene activities have been shown to in the ballpark recapitulate the transcriptomic profiles and discern cell populations (<xref ref-type="bibr" rid="B19">Jiang et al., 2022</xref>). For TF-binding motifs, chromVAR (<xref ref-type="bibr" rid="B35">Schep et al., 2017</xref>) computes a motif deviation score by estimating the gain or loss of accessibility within peaks sharing the same motif relative to the average cell profile; these deviation scores have also been shown to enable accurate clustering of scATAC-seq data.</p>
<p>Notably, most, if not all, of the aforementioned methods carry out &#x201c;unimodal&#x201d; analysis with a single type of feature input (i.e., peaks, genes, or motifs). One of the earliest methods, SCRAT (<xref ref-type="bibr" rid="B18">Ji et al., 2017</xref>), proposes to use empirical and prior knowledge to aggregate the peaks into genes, motifs, and gene sets, while neglecting the peak-level information due to high computational burden. EpiScanpy (<xref ref-type="bibr" rid="B10">Danese et al., 2021</xref>), ArchR (<xref ref-type="bibr" rid="B14">Granja et al., 2021</xref>), and Signac (<xref ref-type="bibr" rid="B40">Stuart et al., 2021</xref>) all generate multimodal feature inputs. However, dimension reduction and clustering are still focused on the peak accessibilities&#x2014;the gene activities are generally integrated with single-cell RNA sequencing (scRNA-seq) data for alignment, and the motif deviation scores are used to identify enriched and/or differentially accessible motifs.</p>
<p>To our best knowledge, no integrative methods are available for a cross-modality analysis of scATAC-seq data, yet it has been shown that the peaks, genes, and motifs all contain signals to separate the different cell types/states. Here, we propose Destin2, a successor to our previous unimodal method Destin (<xref ref-type="bibr" rid="B42">Urrutia et al., 2019</xref>), for cross-modality dimension reduction, clustering, and trajectory reconstruction for scATAC-seq data. The framework integrates cellular-level epigenomic profiles from peak accessibility, motif deviation score, and pseudo-gene activity and learns a shared manifold using the multimodal input. We apply the method to real datasets with both discretized cell types and transient cell states and carry out benchmarking studies to demonstrate how Destin2&#x2019;s cross-modality integration corroborates and improves upon existing methods based on unimodal analyses.</p>
</sec>
<sec sec-type="materials|methods" id="s2">
<title>Materials and methods</title>
<p>
<xref ref-type="fig" rid="F1">Figure 1</xref> outlines Destin2&#x2019;s analytical framework. For unimodal data input, Destin2 utilizes Signac (<xref ref-type="bibr" rid="B40">Stuart et al., 2021</xref>), MAESTRO (<xref ref-type="bibr" rid="B43">Wang et al., 2020</xref>), and chromVAR (<xref ref-type="bibr" rid="B35">Schep et al., 2017</xref>) for pre-processing and generating the matrices of peak accessibility, gene activity, and motif deviation, where the cell dimensions are matched, and yet the feature dimensions differ. The peak matrix can be directly loaded from the output of cellranger-atac or called/refined by MACS2 (<xref ref-type="bibr" rid="B48">Zhang et al., 2008</xref>). Pseudo-gene activities can be derived from either taking the sum of ATAC reads in gene bodies and promoter regions by Signac (<xref ref-type="bibr" rid="B40">Stuart et al., 2021</xref>) or using a regulatory potential model that sums ATAC reads weighted based on existing gene annotations by MAESTRO (<xref ref-type="bibr" rid="B43">Wang et al., 2020</xref>). Motif deviation scores are computed using chromVAR (<xref ref-type="bibr" rid="B35">Schep et al., 2017</xref>) and measure the deviation in chromatin accessibility across the set of peaks containing the TF-binding motifs, compared to a set of background peaks. Destin2, by its default, uses the JASPAR database for pairs of TF and motif annotation in vertebrates (<xref ref-type="bibr" rid="B13">Fornes et al., 2020</xref>).</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>A flowchart outlining the procedures for cross-modality scATAC-seq analysis by Destin2.</p>
</caption>
<graphic xlink:href="fgene-14-1089936-g001.tif"/>
</fig>
<p>For data normalization and dimension reduction, we adopt two parallel and state-of-the-art approaches, latent semantic indexing (LSI) and latent Dirichlet allocation (LDA), for the peak matrix. LSI normalizes reads within peaks using the term frequency-inverse document frequency transformation (TF-IDF), followed by a PCA-based dimension reduction (<xref ref-type="bibr" rid="B40">Stuart et al., 2021</xref>). LDA is a topic modeling approach commonly used in natural language processing and has been successfully applied to scATAC-seq data to identify cell states from topic-cell distribution and explore <italic>cis</italic>-regulatory regions from region-topic distribution by cisTopic (<xref ref-type="bibr" rid="B2">Bravo Gonzalez-Blas et al., 2019</xref>). For the motif and gene matrix, we use <inline-formula id="inf1">
<mml:math id="m1">
<mml:mrow>
<mml:mi>z</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>-score transformation and the LogNormalize function by Seurat (<xref ref-type="bibr" rid="B5">Butler et al., 2018</xref>), followed by principal component analysis (PCA), respectively. These within-modality normalization and dimension reduction, which return peak principal components (PCs), motif PCs, and gene PCs, are necessary. They effectively reduce signal-to-noise ratios, and more importantly, it has been shown that PCA, followed by canonical correlation analysis (CCA), offers a powerful approach to uncover latent structure shared across modalities through an integrative analysis (<xref ref-type="bibr" rid="B3">Brown et al., 2018</xref>). The number of PCs can be chosen by inspecting the variance reduction (i.e., elbow) plot or using the JackStraw method (<xref ref-type="bibr" rid="B33">Satija et al., 2015</xref>), which randomly permutes a subset of the data and compares the PCs for the permuted data with the observed PCs to determine statistical significance.</p>
<p>With the pre-processed and normalized unimodal data input, Destin2 offers three options for cross-modality integration: consensus PCA (CPCA), generalized/multiple CCA (MultiCCA), and weighted nearest neighbor (WNN). Denote the feature input across <inline-formula id="inf2">
<mml:math id="m2">
<mml:mrow>
<mml:mi>K</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> modalities as <inline-formula id="inf3">
<mml:math id="m3">
<mml:mrow>
<mml:msup>
<mml:mi>X</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
<mml:mo>&#x2208;</mml:mo>
<mml:msup>
<mml:mi mathvariant="double-struck">R</mml:mi>
<mml:mrow>
<mml:mi>n</mml:mi>
<mml:mo>&#xd7;</mml:mo>
<mml:msub>
<mml:mi>p</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
</mml:mrow>
</mml:msup>
<mml:mo>,</mml:mo>
<mml:mo>&#x2026;</mml:mo>
<mml:mo>,</mml:mo>
<mml:msup>
<mml:mi>X</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>K</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
<mml:mo>&#x2208;</mml:mo>
<mml:msup>
<mml:mi mathvariant="double-struck">R</mml:mi>
<mml:mrow>
<mml:mi>n</mml:mi>
<mml:mo>&#xd7;</mml:mo>
<mml:msub>
<mml:mi>p</mml:mi>
<mml:mi>K</mml:mi>
</mml:msub>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>, where the <inline-formula id="inf4">
<mml:math id="m4">
<mml:mrow>
<mml:mi>n</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> cells are matched. (I) CPCA (<xref ref-type="bibr" rid="B45">Westerhuis et al., 1998</xref>), algebraically equivalent to applying a second-step PCA to the concatenated peak PCs, motif PCs, and gene PCs, returns consensus PCs as joint dimension reductions, which reveal the union of the latent structure across multiple modalities. To identify the first-rank consensus PC is analogous to solve:<disp-formula id="equ1">
<mml:math id="m5">
<mml:mrow>
<mml:mrow>
<mml:mfenced open="{" close="}" separators="|">
<mml:mrow>
<mml:msup>
<mml:mover accent="true">
<mml:mi>w</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
<mml:mo>,</mml:mo>
<mml:mo>&#x2026;</mml:mo>
<mml:mo>,</mml:mo>
<mml:msup>
<mml:mover accent="true">
<mml:mi>w</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>K</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:mi>argmin</mml:mi>
<mml:msup>
<mml:mrow>
<mml:mfenced open="&#x2016;" close="&#x2016;" separators="|">
<mml:mrow>
<mml:mrow>
<mml:mfenced open="[" close="]" separators="|">
<mml:mrow>
<mml:msup>
<mml:mi>X</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
<mml:mo>,</mml:mo>
<mml:mo>&#x2026;</mml:mo>
<mml:mo>,</mml:mo>
<mml:msup>
<mml:mi>X</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>K</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mrow>
<mml:mfenced open="[" close="]" separators="|">
<mml:mrow>
<mml:msup>
<mml:mi>X</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
<mml:mo>,</mml:mo>
<mml:mo>&#x2026;</mml:mo>
<mml:mo>,</mml:mo>
<mml:msup>
<mml:mi>X</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>K</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="[" close="]" separators="|">
<mml:mrow>
<mml:msup>
<mml:mi>w</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
<mml:mo>,</mml:mo>
<mml:mo>&#x2026;</mml:mo>
<mml:mo>,</mml:mo>
<mml:msup>
<mml:mi>w</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>K</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mfenced open="[" close="]" separators="|">
<mml:mrow>
<mml:msup>
<mml:mi>w</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
<mml:mo>,</mml:mo>
<mml:mo>&#x2026;</mml:mo>
<mml:mo>,</mml:mo>
<mml:msup>
<mml:mi>w</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>K</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mi>T</mml:mi>
</mml:msup>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:mo>,</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>such that <inline-formula id="inf5">
<mml:math id="m6">
<mml:mrow>
<mml:msup>
<mml:mi>w</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>k</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
<mml:mo>&#x2208;</mml:mo>
<mml:msup>
<mml:mi mathvariant="double-struck">R</mml:mi>
<mml:msub>
<mml:mi>p</mml:mi>
<mml:mi>k</mml:mi>
</mml:msub>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula> for <inline-formula id="inf6">
<mml:math id="m7">
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mo>&#x2264;</mml:mo>
<mml:mi>k</mml:mi>
<mml:mo>&#x2264;</mml:mo>
<mml:mi>K</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf7">
<mml:math id="m8">
<mml:mrow>
<mml:mrow>
<mml:mfenced open="&#x2016;" close="&#x2016;" separators="|">
<mml:mrow>
<mml:msup>
<mml:mi>w</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>&#x2b;</mml:mo>
<mml:mo>&#x2026;</mml:mo>
<mml:mo>&#x2b;</mml:mo>
<mml:mrow>
<mml:mfenced open="&#x2016;" close="&#x2016;" separators="|">
<mml:mrow>
<mml:msup>
<mml:mi>w</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>K</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>.</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> (II) MultiCCA (<xref ref-type="bibr" rid="B20">Kettenring, 1971</xref>), on the other hand, finds maximally correlated linear combinations of the features between each pair of modalities by solving:<disp-formula id="equ2">
<mml:math id="m9">
<mml:mrow>
<mml:mrow>
<mml:mfenced open="{" close="}" separators="|">
<mml:mrow>
<mml:msup>
<mml:mover accent="true">
<mml:mi>w</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
<mml:mo>,</mml:mo>
<mml:mo>&#x2026;</mml:mo>
<mml:mo>,</mml:mo>
<mml:msup>
<mml:mover accent="true">
<mml:mi>w</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>K</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:mi>argmax</mml:mi>
<mml:msub>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mo>&#x2264;</mml:mo>
<mml:mi>i</mml:mi>
<mml:mo>&#x3c;</mml:mo>
<mml:mi>j</mml:mi>
<mml:mo>&#x2264;</mml:mo>
<mml:mi>K</mml:mi>
</mml:mrow>
</mml:msub>
<mml:msup>
<mml:msup>
<mml:mi>w</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
<mml:mi>T</mml:mi>
</mml:msup>
<mml:msup>
<mml:msup>
<mml:mi>X</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
<mml:mi>T</mml:mi>
</mml:msup>
<mml:msup>
<mml:mi>X</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
<mml:msup>
<mml:mi>w</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
<mml:mo>,</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>such that <inline-formula id="inf8">
<mml:math id="m10">
<mml:mrow>
<mml:msup>
<mml:mi>w</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>k</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
<mml:mo>&#x2208;</mml:mo>
<mml:msup>
<mml:mi mathvariant="double-struck">R</mml:mi>
<mml:msub>
<mml:mi>p</mml:mi>
<mml:mi>k</mml:mi>
</mml:msub>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf9">
<mml:math id="m11">
<mml:mrow>
<mml:msup>
<mml:msup>
<mml:mi>w</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>k</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
<mml:mi>T</mml:mi>
</mml:msup>
<mml:msup>
<mml:msup>
<mml:mi>X</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>k</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
<mml:mi>T</mml:mi>
</mml:msup>
<mml:msup>
<mml:mi>X</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>k</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
<mml:msup>
<mml:mi>w</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>k</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> for <inline-formula id="inf10">
<mml:math id="m12">
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mo>&#x2264;</mml:mo>
<mml:mi>k</mml:mi>
<mml:mo>&#x2264;</mml:mo>
<mml:mi>K</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>; we utilize the implementation from the mogsa package (<xref ref-type="bibr" rid="B28">Meng et al., 2019</xref>) in R. (III) Instead of optimizing for the modality- and feature-specific loading vector for projections of the three modalities, the recently developed WNN method (<xref ref-type="bibr" rid="B16">Hao et al., 2021</xref>) learns cell- and modality-specific weights, which reflect the information content for each modality and are used to calculate a weighted cell-cell similarity measure and construct a WNN graph. We will not go into the algorithmic details of the WNN method&#x2014;readers can refer to the Seurat V4 publication (<xref ref-type="bibr" rid="B16">Hao et al., 2021</xref>), where the WNN framework is extended to more than two modalities with matched cells.</p>
<p>Followed by joint dimension reduction and graph construction, tSNE/UMAP can be used for visualization. Destin2 adopts Louvain/Leiden clustering (<xref ref-type="bibr" rid="B41">Traag et al., 2019</xref>) for community detection and identification of discrete cell clusters. The number of cell clusters (i.e., the resolution parameter) can be optimized using the clustree method (<xref ref-type="bibr" rid="B47">Zappia and Oshlack, 2018</xref>), which builds a tree to visualize and examine how clusters are related to each other at varying resolutions, allowing researchers to assess which clusters are distinct and which are unstable with the use of additional metrics such as the SC3 stability index (<xref ref-type="bibr" rid="B21">Kiselev et al., 2017</xref>). For cell population exhibiting continuous and connected cell states, Destin2 resorts to a flexible and modularized approach, Slingshot (<xref ref-type="bibr" rid="B38">Street et al., 2018</xref>), for trajectory reconstruction; smooth representation of the lineages and pseudotime values are inferred using the joint dimension reduction and visualized on the UMAP space.</p>
</sec>
<sec sec-type="results" id="s3">
<title>Results</title>
<sec id="s3-1">
<title>Destin2 improves clustering accuracy compared to unimodal analysis methods</title>
<p>We apply Destin2 to four scATAC-seq datasets of human peripheral blood mononuclear cells (PBMCs) from 10x Genomics, adult mouse cortex cells from 10x Genomics, human bone marrow mononuclear cells (BMMCs) (<xref ref-type="bibr" rid="B15">Granja et al., 2019</xref>), and human fetal organs (<xref ref-type="bibr" rid="B11">Domcke et al., 2020</xref>). See <xref ref-type="sec" rid="s10">Supplementary Table S1</xref> for summary and details of the data. For the PBMC and adult mouse cortex datasets, we annotate cell types using scRNA-seq experiments from the same biological systems (PBMC from 10x Genomics and mouse brain from the Allen Brain Institute), utilizing the CCA-based method for cross-modality integration and label transfer (<xref ref-type="bibr" rid="B39">Stuart et al., 2019</xref>) and only keeping cells that can be uniquely and confidently assigned to one cell type. For the BMMC dataset, we use the curated cell type labels from the original publication (<xref ref-type="bibr" rid="B15">Granja et al., 2019</xref>). For the human fetal dataset, we resort to the tissues of origin from the experimental design/sample collection. These cell types/tissues are used as ground truths for performance assessment.</p>
<p>We apply unimodal analysis methods (i.e., peak analysis by Signac and cisTopic, motif analysis by chromVAR, and gene activity analysis by Signac/MAESTRO) and Destin2 to these datasets, with UMAP visualizations shown in <xref ref-type="sec" rid="s10">Supplementary Figure S1</xref>. For benchmarking, we adopt four metrics for performance assessment. (I) Adjusted rand index (ARI) is used to compare the identified cell clusters against the annotated cell types, with 1 indicating that the two are exactly the same. (II) Adjusted mutual information (AMI) is similar to ARI but is more suited when there exist small and unbalanced clusters (<xref ref-type="bibr" rid="B32">Romano et al., 2016</xref>). (III) Homogeneity score (H-score) is an entropy-based measure of the similarity between two clusterings and ranges between 0 and 1, where 1 indicates perfect homogeneity. (IV) Cell-type local inverse Simpson&#x2019;s index (cLISI) (<xref ref-type="bibr" rid="B22">Korsunsky et al., 2019</xref>) is used to assess the degree of mixing/separation of annotated cell types, with 1 indicating that the different cell types group separately and 2 indicating that the different cell types erroneously group together.</p>
<p>Across the four scATAC-seq datasets, our results suggest that the multimodal analysis methods proposed by Destin2 improve clustering accuracy compared to conventional unimodal analysis methods using ARI and AMI as assessment metrics (<xref ref-type="fig" rid="F2">Figure 2</xref>; <xref ref-type="sec" rid="s10">Supplementary Table S2</xref>). For cLISI and H-score, since the gold-standard cell-type labels are transferred using the LSI-based dimension reduction as weights, it is not surprising that the LSI method achieves the top performance; non-etheless, the difference between LSI-based methods and Destin2&#x2019;s cross-modality integration results are negligible (<xref ref-type="fig" rid="F2">Figure 2</xref>; <xref ref-type="sec" rid="s10">Supplementary Table S2</xref>). Note that while the motif analysis returns the seemingly worst result, whether the motif modality is included in the integrative analysis does not significantly alter the output (<xref ref-type="sec" rid="s10">Supplementary Figure S2</xref>), demonstrating Destin2&#x2019;s robustness to the differential information content across modalities. Additionally, and more importantly, careful inspection of the confusion matrix (shown as a heatmap in <xref ref-type="sec" rid="s10">Supplementary Figure S3</xref>) suggests that Destin2 is able to identify cell types/states that are otherwise indistinguishable and/or wrongly classified from a unimodal analysis&#x2014;e.g., Lamp5 v.s. Vip in <xref ref-type="sec" rid="s10">Supplementary Figure S3B</xref>, as well as GMP v.s. CD14 monocytes and CLP v.s. pre-B cells in <xref ref-type="sec" rid="s10">Supplementary Figure S3C</xref>.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>Benchmarking clustering accuracy. Four different metrics&#x2014;ARI, AMI, H-score, and cLISI&#x2014;were used for performance assessment. For each metric and each method, results from the four unimodal scATAC-seq datasets are aggregated (i.e., each boxplot contains four data points). The ranks of the methods for each metric are computed and then combined across all metrics and datasets. Destin2&#x2019;s multimodal analysis framework achieves the highest rank and improves clustering accuracy compared to conventional unimodal analysis methods.</p>
</caption>
<graphic xlink:href="fgene-14-1089936-g002.tif"/>
</fig>
<p>For downstream analysis, we first demonstrate how to determine the clustering resolution using the clustree method (<xref ref-type="sec" rid="s10">Supplementary Figure S4</xref>). Specifically, clustering results with varying clustering resolutions [and thus varying SC3 stability measures (<xref ref-type="bibr" rid="B21">Kiselev et al., 2017</xref>)] are visualized as a tree: new clusters form from existing clusters, and the overlap in cells between clusters at adjacent resolutions is computed and used to calculate the in-proportion for each edge. Unstable clusters result in cells switching between branches of the trees, with low in-proportion edges; one can thus infer which areas of the tree are likely to be the result of true clusters and which are caused by over-clustering (<xref ref-type="bibr" rid="B47">Zappia and Oshlack, 2018</xref>). For cell populations with continuous cell states, we further demonstrate how to reconstruct the development/differentiation trajectory using Destin2&#x2019;s joint dimension reduction paired with the Slingshot method. As an example, we show the reconstruction of the true branching lineages during human hematopoietic differentiation using the BMMC data (<xref ref-type="sec" rid="s10">Supplementary Figure S5</xref>).</p>
</sec>
<sec id="s3-2">
<title>Destin2 better preserves cell-cell similarities using single-cell RNA and ATAC multiomic data</title>
<p>We further applied Destin2 to three single-cell RNA and ATAC multiomic datasets of human PBMCs from 10x Genomics, adult mouse cortex cells from 10x Genomics, and mouse skin data from SHARE-seq (<xref ref-type="bibr" rid="B27">Ma et al., 2020</xref>). See <xref ref-type="sec" rid="s10">Supplementary Table S1</xref> for a data summary. In using these multiomic datasets, we demonstrate how Destin2&#x2019;s cross-modality analyses preserve true cell-cell similarities by using the matched cell information as ground truth. Importantly, this also does not need the RNA-ATAC alignment or the transfer of discretized cell-type labels, which often fails for cell populations consisting of transient states.</p>
<p>Specifically, we first obtained the low-dimensional embedding using the ATAC data alone by the various unimodal methods and Destin2&#x2019;s multimodal methods. We then reconstructed the low-dimensional embedding using the RNA data using Seurat&#x2019;s scRNA-seq processing pipeline (<xref ref-type="bibr" rid="B5">Butler et al., 2018</xref>). We then assess how the low-dimensional embedding by the ATAC domain agrees with that by the RNA domain. For benchmarking, we adopt two additional metrics designed specifically for the single-cell multiomic data&#x2014;fraction of samples closer than the nearest neighbor (FOSCTTNN) and agreement. Both metrics measure the preservation of a cell&#x2019;s nearest neighbors between the RNA and ATAC domains and do not rely on annotated cell types or identified clusters. FOSCTTNN is adapted from the &#x201c;fraction of samples closer than the true match&#x201d; metric (<xref ref-type="bibr" rid="B25">Liu et al., 2019</xref>): for each cell, we first identify its nearest neighbor (i.e., closest cell) in the RNA domain as ground truth, and then, in the ATAC domain, we calculate the fraction of cells that are closer than its true nearest neighbor. For agreement (<xref ref-type="bibr" rid="B44">Welch et al., 2019</xref>), we identify each cell&#x2019;s <inline-formula id="inf11">
<mml:math id="m13">
<mml:mrow>
<mml:mi>k</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> nearest neighbors in the RNA and ATAC domains, respectively, and then calculate the fraction of overlap. Nearest neighbors are identified using Euclidean distance of the cells&#x2019; reduced dimension from each modality and method. The two cell-specific metrics can be further summarized using median and Gini mean difference (GMD) across cells.</p>
<p>For the three multiomic datasets, our results suggest that the multimodal analysis methods offered by Destin2 exhibit top or near-top performance. For FOSCTTNN, Destin2&#x2019;s cross-modality integration results are either top-performing or negligibly different from the top performer (<xref ref-type="table" rid="T1">Table 1</xref>); for agreement across different <inline-formula id="inf12">
<mml:math id="m14">
<mml:mrow>
<mml:mi>k</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> (number of nearest neighbors), the WNN method achieves the top performance (<xref ref-type="table" rid="T2">Table 2</xref>). Interestingly and importantly, neither LSI nor LDA is indefinitely preferred from this benchmark analysis&#x2014;e.g., LDA outperforms LSI using the FOSCTTNN metric in the PBMC data (<xref ref-type="table" rid="T1">Table 1</xref>), while LSI improves upon LDA using the agreement metric by a large margin in the mouse brain data (<xref ref-type="table" rid="T2">Table 2</xref>). In real data analysis, where there is no ground truth to guide method selection, Destin2 integrates and corroborates information from both methods and demonstrates its robustness.</p>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>FOSCTTNN metrics on single-cell RNA and ATAC multiomic datasets. Destin2&#x2019;s multimodal analyses achieve top or near-top performance. FOSCTTNN is bound between 0 and 1, with 0 being the best performance. Neither LSI nor LDA is indefinitely preferred from this benchmark analysis; Destin2 integrates and corroborates information across methods and modalities.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th colspan="7" align="left">(A) PBMC 10x Genomics FOSCTTNN</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">
<bold>Method</bold>
</td>
<td align="center">
<bold>q1</bold>
</td>
<td align="center">
<bold>Median</bold>
</td>
<td align="center">
<bold>GMD</bold>
</td>
<td align="center">
<bold>Mean</bold>
</td>
<td align="center">
<bold>sd</bold>
</td>
<td align="center">
<bold>q3</bold>
</td>
</tr>
<tr>
<td align="center">Peak_LSI</td>
<td align="center">0.015</td>
<td align="center">0.045</td>
<td align="center">0.107</td>
<td align="center">0.089</td>
<td align="center">0.126</td>
<td align="center">0.116</td>
</tr>
<tr>
<td align="center">Peak_LDA</td>
<td align="center">0.013</td>
<td align="center">0.039</td>
<td align="center">0.081</td>
<td align="center">0.069</td>
<td align="center">0.095</td>
<td align="center">0.090</td>
</tr>
<tr>
<td align="center">Motif</td>
<td align="center">0.048</td>
<td align="center">0.131</td>
<td align="center">0.168</td>
<td align="center">0.174</td>
<td align="center">0.158</td>
<td align="center">0.261</td>
</tr>
<tr>
<td align="center">GeneActivity</td>
<td align="center">0.017</td>
<td align="center">0.054</td>
<td align="center">0.124</td>
<td align="center">0.104</td>
<td align="center">0.133</td>
<td align="center">0.137</td>
</tr>
<tr>
<td align="center">ConsensusPCA</td>
<td align="center">0.014</td>
<td align="center">0.045</td>
<td align="center">0.098</td>
<td align="center">0.084</td>
<td align="center">0.107</td>
<td align="center">0.118</td>
</tr>
<tr>
<td align="center">MultiCCA</td>
<td align="center">0.014</td>
<td align="center">0.044</td>
<td align="center">0.104</td>
<td align="center">0.086</td>
<td align="center">0.121</td>
<td align="center">0.112</td>
</tr>
<tr>
<td align="center">WNN</td>
<td align="center">0.013</td>
<td align="center">0.042</td>
<td align="center">0.094</td>
<td align="center">0.080</td>
<td align="center">0.102</td>
<td align="center">0.110</td>
</tr>
<tr>
<td colspan="7" align="left">(B) Mouse Brain 10x Genomics FOSCTTNN</td>
</tr>
<tr>
<td align="center">
<bold>Method</bold>
</td>
<td align="center">
<bold>q1</bold>
</td>
<td align="center">
<bold>Median</bold>
</td>
<td align="center">
<bold>GMD</bold>
</td>
<td align="center">
<bold>Mean</bold>
</td>
<td align="center">
<bold>sd</bold>
</td>
<td align="center">
<bold>q3</bold>
</td>
</tr>
<tr>
<td align="center">Peak_LSI</td>
<td align="center">0.004</td>
<td align="center">0.014</td>
<td align="center">0.085</td>
<td align="center">0.056</td>
<td align="center">0.130</td>
<td align="center">0.043</td>
</tr>
<tr>
<td align="center">Peak_LDA</td>
<td align="center">0.006</td>
<td align="center">0.021</td>
<td align="center">0.077</td>
<td align="center">0.056</td>
<td align="center">0.110</td>
<td align="center">0.056</td>
</tr>
<tr>
<td align="center">Motif</td>
<td align="center">0.010</td>
<td align="center">0.033</td>
<td align="center">0.105</td>
<td align="center">0.079</td>
<td align="center">0.133</td>
<td align="center">0.085</td>
</tr>
<tr>
<td align="center">GeneActivity</td>
<td align="center">0.028</td>
<td align="center">0.109</td>
<td align="center">0.308</td>
<td align="center">0.257</td>
<td align="center">0.294</td>
<td align="center">0.487</td>
</tr>
<tr>
<td align="center">ConsensusPCA</td>
<td align="center">0.005</td>
<td align="center">0.017</td>
<td align="center">0.088</td>
<td align="center">0.059</td>
<td align="center">0.129</td>
<td align="center">0.049</td>
</tr>
<tr>
<td align="center">MultiCCA</td>
<td align="center">0.005</td>
<td align="center">0.017</td>
<td align="center">0.083</td>
<td align="center">0.057</td>
<td align="center">0.122</td>
<td align="center">0.050</td>
</tr>
<tr>
<td align="center">WNN</td>
<td align="center">0.005</td>
<td align="center">0.018</td>
<td align="center">0.091</td>
<td align="center">0.062</td>
<td align="center">0.130</td>
<td align="center">0.055</td>
</tr>
<tr>
<td colspan="7" align="left">(C) Mouse Skin SHARE-seq FOSCTTNN</td>
</tr>
<tr>
<td align="center">
<bold>Method</bold>
</td>
<td align="center">
<bold>q1</bold>
</td>
<td align="center">
<bold>Median</bold>
</td>
<td align="center">
<bold>GMD</bold>
</td>
<td align="center">
<bold>Mean</bold>
</td>
<td align="center">
<bold>sd</bold>
</td>
<td align="center">
<bold>q3</bold>
</td>
</tr>
<tr>
<td align="center">Peak_LSI</td>
<td align="center">0.011</td>
<td align="center">0.034</td>
<td align="center">0.165</td>
<td align="center">0.117</td>
<td align="center">0.196</td>
<td align="center">0.110</td>
</tr>
<tr>
<td align="center">Peak_LDA</td>
<td align="center">0.011</td>
<td align="center">0.036</td>
<td align="center">0.143</td>
<td align="center">0.104</td>
<td align="center">0.174</td>
<td align="center">0.101</td>
</tr>
<tr>
<td align="center">Motif</td>
<td align="center">0.024</td>
<td align="center">0.076</td>
<td align="center">0.185</td>
<td align="center">0.154</td>
<td align="center">0.194</td>
<td align="center">0.200</td>
</tr>
<tr>
<td align="center">GeneActivity</td>
<td align="center">0.062</td>
<td align="center">0.208</td>
<td align="center">0.332</td>
<td align="center">0.323</td>
<td align="center">0.301</td>
<td align="center">0.551</td>
</tr>
<tr>
<td align="center">ConsensusPCA</td>
<td align="center">0.011</td>
<td align="center">0.034</td>
<td align="center">0.147</td>
<td align="center">0.105</td>
<td align="center">0.180</td>
<td align="center">0.097</td>
</tr>
<tr>
<td align="center">MultiCCA</td>
<td align="center">0.011</td>
<td align="center">0.034</td>
<td align="center">0.139</td>
<td align="center">0.100</td>
<td align="center">0.176</td>
<td align="center">0.092</td>
</tr>
<tr>
<td align="center">WNN</td>
<td align="center">0.010</td>
<td align="center">0.031</td>
<td align="center">0.134</td>
<td align="center">0.096</td>
<td align="center">0.170</td>
<td align="center">0.091</td>
</tr>
</tbody>
</table>
</table-wrap>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>Agreement metrics on single-cell RNA and ATAC multiomic datasets. Different numbers of nearest numbers (<inline-formula id="inf13">
<mml:math id="m15">
<mml:mrow>
<mml:mi>k</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>) were selected. Destin2&#x2019;s multimodal analyses, especially the WNN method, achieve top or near-top performance. Agreement is bound between 0 and 1, with 1 being the best performance. Neither LSI nor LDA is indefinitely preferred from this benchmark analysis; Destin2 integrates and corroborates information across methods and modalities.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th colspan="8" align="left">(A) PBMC 10x Genomics Agreement</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">
<bold>k</bold>
</td>
<td align="center">
<bold>Peak_LSI</bold>
</td>
<td align="center">
<bold>Peak_LDA</bold>
</td>
<td align="center">
<bold>Motif</bold>
</td>
<td align="center">
<bold>Gene Activity</bold>
</td>
<td align="center">
<bold>Consensus PCA</bold>
</td>
<td align="center">
<bold>MultiCCA</bold>
</td>
<td align="center">
<bold>WNN</bold>
</td>
</tr>
<tr>
<td align="center">50</td>
<td align="center">0.091</td>
<td align="center">0.102</td>
<td align="center">0.032</td>
<td align="center">0.085</td>
<td align="center">0.092</td>
<td align="center">0.091</td>
<td align="center">0.107</td>
</tr>
<tr>
<td align="center">100</td>
<td align="center">0.163</td>
<td align="center">0.175</td>
<td align="center">0.061</td>
<td align="center">0.150</td>
<td align="center">0.163</td>
<td align="center">0.163</td>
<td align="center">0.183</td>
</tr>
<tr>
<td align="center">150</td>
<td align="center">0.220</td>
<td align="center">0.232</td>
<td align="center">0.086</td>
<td align="center">0.200</td>
<td align="center">0.219</td>
<td align="center">0.221</td>
<td align="center">0.241</td>
</tr>
<tr>
<td align="center">200</td>
<td align="center">0.269</td>
<td align="center">0.282</td>
<td align="center">0.110</td>
<td align="center">0.244</td>
<td align="center">0.268</td>
<td align="center">0.270</td>
<td align="center">0.290</td>
</tr>
<tr>
<td colspan="8" align="left">(B) Mouse Brain 10x Genomics Agreement</td>
</tr>
<tr>
<td align="center">
<bold>k</bold>
</td>
<td align="center">
<bold>Peak_LSI</bold>
</td>
<td align="center">
<bold>Peak_LDA</bold>
</td>
<td align="center">
<bold>Motif</bold>
</td>
<td align="center">
<bold>Gene Activity</bold>
</td>
<td align="center">
<bold>Consensus PCA</bold>
</td>
<td align="center">
<bold>MultiCCA</bold>
</td>
<td align="center">
<bold>WNN</bold>
</td>
</tr>
<tr>
<td align="center">50</td>
<td align="center">0.350</td>
<td align="center">0.288</td>
<td align="center">0.222</td>
<td align="center">0.119</td>
<td align="center">0.324</td>
<td align="center">0.318</td>
<td align="center">0.314</td>
</tr>
<tr>
<td align="center">100</td>
<td align="center">0.514</td>
<td align="center">0.439</td>
<td align="center">0.358</td>
<td align="center">0.196</td>
<td align="center">0.481</td>
<td align="center">0.478</td>
<td align="center">0.468</td>
</tr>
<tr>
<td align="center">150</td>
<td align="center">0.613</td>
<td align="center">0.549</td>
<td align="center">0.455</td>
<td align="center">0.255</td>
<td align="center">0.584</td>
<td align="center">0.583</td>
<td align="center">0.569</td>
</tr>
<tr>
<td align="center">200</td>
<td align="center">0.681</td>
<td align="center">0.629</td>
<td align="center">0.532</td>
<td align="center">0.306</td>
<td align="center">0.659</td>
<td align="center">0.658</td>
<td align="center">0.643</td>
</tr>
<tr>
<td colspan="8" align="left">(C) Mouse Skin SHARE-seq Agreement</td>
</tr>
<tr>
<td align="center">
<bold>k</bold>
</td>
<td align="center">
<bold>Peak_LSI</bold>
</td>
<td align="center">
<bold>Peak_LDA</bold>
</td>
<td align="center">
<bold>Motif</bold>
</td>
<td align="center">
<bold>Gene Activity</bold>
</td>
<td align="center">
<bold>Consensus PCA</bold>
</td>
<td align="center">
<bold>MultiCCA</bold>
</td>
<td align="center">
<bold>WNN</bold>
</td>
</tr>
<tr>
<td align="center">50</td>
<td align="center">0.046</td>
<td align="center">0.048</td>
<td align="center">0.024</td>
<td align="center">0.010</td>
<td align="center">0.046</td>
<td align="center">0.046</td>
<td align="center">0.050</td>
</tr>
<tr>
<td align="center">100</td>
<td align="center">0.088</td>
<td align="center">0.088</td>
<td align="center">0.047</td>
<td align="center">0.020</td>
<td align="center">0.087</td>
<td align="center">0.085</td>
<td align="center">0.094</td>
</tr>
<tr>
<td align="center">150</td>
<td align="center">0.124</td>
<td align="center">0.122</td>
<td align="center">0.068</td>
<td align="center">0.030</td>
<td align="center">0.123</td>
<td align="center">0.122</td>
<td align="center">0.131</td>
</tr>
<tr>
<td align="center">200</td>
<td align="center">0.157</td>
<td align="center">0.154</td>
<td align="center">0.087</td>
<td align="center">0.039</td>
<td align="center">0.156</td>
<td align="center">0.155</td>
<td align="center">0.166</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
</sec>
<sec sec-type="discussion" id="s4">
<title>Discussion</title>
<p>We propose Destin2 to integrate multimodal peak accessibility, motif deviation, and pseudo-gene activity measures derived from scATAC-seq data. Destin2&#x2019;s cross-modality integration can finish within a few minutes on a local computer; the computational bottleneck comes from the preprocessing step, which can also finish reasonably fast within an hour across tens of thousands of cells (<xref ref-type="sec" rid="s10">Supplementary Table S3</xref>). For peak accessibility, Destin2 integrates two most popular techniques&#x2014;LSI and LDA&#x2014;for data pre-processing and within-modality dimension reduction. While Destin2 is not restricted to only taking peak accessibilities as input, our framework offers a strategy to ensemble results from the various peak-modeling methods (<xref ref-type="bibr" rid="B6">Chen et al., 2019</xref>), so long as method-specific dimension reductions are provided. For motif deviation, Destin2, by its default, resorts to chromVAR (<xref ref-type="bibr" rid="B35">Schep et al., 2017</xref>), which can be computationally intensive and infeasible to handle atlas-scale scATAC-seq data. While alternative methods are currently being developed for higher scalability, a viable shortcut solution is to process the entire data in mini batches (i.e., random subsamples of the cells), thus not requiring all the data to be loaded into memory at one time. Such a strategy has been successfully applied to scRNA-seq data with millions of cells (<xref ref-type="bibr" rid="B17">Hicks et al., 2021</xref>). For pseudo-gene activity, Destin2 aggregates ATAC reads over gene bodies and promoter regions using Signac (<xref ref-type="bibr" rid="B40">Stuart et al., 2021</xref>) or MAESTRO (<xref ref-type="bibr" rid="B43">Wang et al., 2020</xref>), yet this largely neglects peaks and fragments from intergenic and non-coding regions. Additional annotations, such as the enhancers (<xref ref-type="bibr" rid="B36">Shlyueva et al., 2014</xref>), super-enhancers (<xref ref-type="bibr" rid="B30">Pott and Lieb, 2015</xref>), A/B compartments (<xref ref-type="bibr" rid="B24">Lieberman-Aiden et al., 2009</xref>), and chromatin loops (<xref ref-type="bibr" rid="B31">Rao et al., 2014</xref>), can be easily incorporated into Destin2&#x2019;s framework as additional modalities to be integrated.</p>
<p>For cross-modality joint modeling, Destin2 utilizes three statistically rigorous and computationally efficient methods&#x2014;CPCA, MultiCCA, and WNN&#x2014;and shows its outperformance and robustness. Additional methods that fall in the realm of multiomic integration [e.g., JIVE (<xref ref-type="bibr" rid="B26">Lock et al., 2013</xref>), MOFA (<xref ref-type="bibr" rid="B1">Argelaguet et al., 2018</xref>), <italic>etc.</italic>] have not been thoroughly explored. For CCA, its variants and extensions, such as sparse CCA (<xref ref-type="bibr" rid="B46">Witten et al., 2009</xref>) and decomposition-based CCA (<xref ref-type="bibr" rid="B37">Shu et al., 2020</xref>), can potentially further boost performance. Overall, we believe that the framework by Destin2 introduces the concept of multiomic integration to scATAC-seq data; through the various benchmarking studies, we exemplify its utility and benefit and illustrate how it can better facilitate downstream analyses.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="s5">
<title>Data availability statement</title>
<p>The datasets presented in this study can be found in online repositories. The names of the repository/repositories and accession number(s) can be found in the article/<xref ref-type="sec" rid="s10">Supplementary Material</xref>.</p>
</sec>
<sec id="s6">
<title>Author contributions</title>
<p>YJ initiated and envisioned the study. YJ, PG, JL, and LW developed and implemented the algorithm. All authors carried out data analyses. YJ and PG compiled the R package. YJ and PG wrote the manuscript, which was edited and approved by all authors.</p>
</sec>
<sec id="s7">
<title>Funding</title>
<p>This work was supported by the National Institutes of Health (NIH) grant R35 GM138342 to YJ.</p>
</sec>
<sec sec-type="COI-statement" id="s8">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s9">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s10">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fgene.2023.1089936/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fgene.2023.1089936/full&#x23;supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="DataSheet1.PDF" id="SM1" mimetype="application/PDF" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Argelaguet</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Velten</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Arnol</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Dietrich</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Zenz</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Marioni</surname>
<given-names>J. C.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Multi-Omics Factor Analysis-a framework for unsupervised integration of multi-omics data sets</article-title>. <source>Mol. Syst. Biol.</source> <volume>14</volume>, <fpage>e8124</fpage>. <pub-id pub-id-type="doi">10.15252/msb.20178124</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bravo Gonzalez-Blas</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Minnoye</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Papasokrati</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Aibar</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Hulselmans</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Christiaens</surname>
<given-names>V.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>cisTopic: cis-regulatory topic modeling on single-cell ATAC-seq data</article-title>. <source>Nat. Methods</source> <volume>16</volume>, <fpage>397</fpage>&#x2013;<lpage>400</lpage>. <pub-id pub-id-type="doi">10.1038/s41592-019-0367-1</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Brown</surname>
<given-names>B. C.</given-names>
</name>
<name>
<surname>Bray</surname>
<given-names>N. L.</given-names>
</name>
<name>
<surname>Pachter</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Expression reflects population structure</article-title>. <source>PLoS Genet.</source> <volume>14</volume>, <fpage>e1007841</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pgen.1007841</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Buenrostro</surname>
<given-names>J. D.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Litzenburger</surname>
<given-names>U. M.</given-names>
</name>
<name>
<surname>Ruff</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Gonzales</surname>
<given-names>M. L.</given-names>
</name>
<name>
<surname>Snyder</surname>
<given-names>M. P.</given-names>
</name>
<etal/>
</person-group> (<year>2015</year>). <article-title>Single-cell chromatin accessibility reveals principles of regulatory variation</article-title>. <source>Nature</source> <volume>523</volume>, <fpage>486</fpage>&#x2013;<lpage>490</lpage>. <pub-id pub-id-type="doi">10.1038/nature14590</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Butler</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Hoffman</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Smibert</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Papalexi</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Satija</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Integrating single-cell transcriptomic data across different conditions, technologies, and species</article-title>. <source>Nat. Biotechnol.</source> <volume>36</volume>, <fpage>411</fpage>&#x2013;<lpage>420</lpage>. <pub-id pub-id-type="doi">10.1038/nbt.4096</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Lareau</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Andreani</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Vinyard</surname>
<given-names>M. E.</given-names>
</name>
<name>
<surname>Garcia</surname>
<given-names>S. P.</given-names>
</name>
<name>
<surname>Clement</surname>
<given-names>K.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Assessment of computational methods for the analysis of single-cell ATAC-seq data</article-title>. <source>Genome Biol.</source> <volume>20</volume>, <fpage>241</fpage>. <pub-id pub-id-type="doi">10.1186/s13059-019-1854-5</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Yan</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Jiang</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Lin</surname>
<given-names>Z.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>RA3 is a reference-guided approach for epigenetic characterization of single cells</article-title>. <source>Nat. Commun.</source> <volume>12</volume>, <fpage>2177</fpage>. <pub-id pub-id-type="doi">10.1038/s41467-021-22495-4</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cusanovich</surname>
<given-names>D. A.</given-names>
</name>
<name>
<surname>Daza</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Adey</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Pliner</surname>
<given-names>H. A.</given-names>
</name>
<name>
<surname>Christiansen</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Gunderson</surname>
<given-names>K. L.</given-names>
</name>
<etal/>
</person-group> (<year>2015</year>). <article-title>Multiplex single cell profiling of chromatin accessibility by combinatorial cellular indexing</article-title>. <source>Science</source> <volume>348</volume>, <fpage>910</fpage>&#x2013;<lpage>914</lpage>. <pub-id pub-id-type="doi">10.1126/science.aab1601</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cusanovich</surname>
<given-names>D. A.</given-names>
</name>
<name>
<surname>Hill</surname>
<given-names>A. J.</given-names>
</name>
<name>
<surname>Aghamirzaie</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Daza</surname>
<given-names>R. M.</given-names>
</name>
<name>
<surname>Pliner</surname>
<given-names>H. A.</given-names>
</name>
<name>
<surname>Berletch</surname>
<given-names>J. B.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>A single-cell atlas of <italic>in vivo</italic> mammalian chromatin accessibility</article-title>. <source>Cell</source> <volume>174</volume>, <fpage>1309</fpage>&#x2013;<lpage>1324.e18</lpage>. <pub-id pub-id-type="doi">10.1016/j.cell.2018.06.052</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Danese</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Richter</surname>
<given-names>M. L.</given-names>
</name>
<name>
<surname>Chaichoompu</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Fischer</surname>
<given-names>D. S.</given-names>
</name>
<name>
<surname>Theis</surname>
<given-names>F. J.</given-names>
</name>
<name>
<surname>Colome-Tatche</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>EpiScanpy: Integrated single-cell epigenomic analysis</article-title>. <source>Nat. Commun.</source> <volume>12</volume>, <fpage>5228</fpage>. <pub-id pub-id-type="doi">10.1038/s41467-021-25131-3</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Domcke</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Hill</surname>
<given-names>A. J.</given-names>
</name>
<name>
<surname>Daza</surname>
<given-names>R. M.</given-names>
</name>
<name>
<surname>Cao</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>O&#x27;Day</surname>
<given-names>D. R.</given-names>
</name>
<name>
<surname>Pliner</surname>
<given-names>H. A.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>A human cell atlas of fetal chromatin accessibility</article-title>. <source>Science</source> <volume>370</volume>, <fpage>eaba7612</fpage>. <pub-id pub-id-type="doi">10.1126/science.aba7612</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fang</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Preissl</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Hou</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Lucero</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>X.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Comprehensive analysis of single cell ATAC-seq data with SnapATAC</article-title>. <source>Nat. Commun.</source> <volume>12</volume>, <fpage>1337</fpage>. <pub-id pub-id-type="doi">10.1038/s41467-021-21583-9</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fornes</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Castro-Mondragon</surname>
<given-names>J. A.</given-names>
</name>
<name>
<surname>Khan</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>van der Lee</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Richmond</surname>
<given-names>P. A.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Jaspar 2020: Update of the open-access database of transcription factor binding profiles</article-title>. <source>Nucleic Acids Res.</source> <volume>48</volume>, <fpage>D87</fpage>&#x2013;<lpage>D92</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkz1001</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Granja</surname>
<given-names>J. M.</given-names>
</name>
<name>
<surname>Corces</surname>
<given-names>M. R.</given-names>
</name>
<name>
<surname>Pierce</surname>
<given-names>S. E.</given-names>
</name>
<name>
<surname>Bagdatli</surname>
<given-names>S. T.</given-names>
</name>
<name>
<surname>Choudhry</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Chang</surname>
<given-names>H. Y.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>ArchR is a scalable software package for integrative single-cell chromatin accessibility analysis</article-title>. <source>Nat. Genet.</source> <volume>53</volume>, <fpage>403</fpage>&#x2013;<lpage>411</lpage>. <pub-id pub-id-type="doi">10.1038/s41588-021-00790-6</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Granja</surname>
<given-names>J. M.</given-names>
</name>
<name>
<surname>Klemm</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>McGinnis</surname>
<given-names>L. M.</given-names>
</name>
<name>
<surname>Kathiria</surname>
<given-names>A. S.</given-names>
</name>
<name>
<surname>Mezger</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Corces</surname>
<given-names>M. R.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Single-cell multiomic analysis identifies regulatory programs in mixed-phenotype acute leukemia</article-title>. <source>Nat. Biotechnol.</source> <volume>37</volume>, <fpage>1458</fpage>&#x2013;<lpage>1465</lpage>. <pub-id pub-id-type="doi">10.1038/s41587-019-0332-7</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hao</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Hao</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Andersen-Nissen</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Mauck</surname>
<given-names>W. M.</given-names>
<suffix>3rd</suffix>
</name>
<name>
<surname>Zheng</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Butler</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Integrated analysis of multimodal single-cell data</article-title>. <source>Cell</source> <volume>184</volume>, <fpage>3573</fpage>&#x2013;<lpage>3587.e29</lpage>. <pub-id pub-id-type="doi">10.1016/j.cell.2021.04.048</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hicks</surname>
<given-names>S. C.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Ni</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Purdom</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Risso</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>mbkmeans: Fast clustering for single cell data using mini-batch k-means</article-title>. <source>PLoS Comput. Biol.</source> <volume>17</volume>, <fpage>e1008625</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pcbi.1008625</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ji</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Ji</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Single-cell regulome data analysis by SCRAT</article-title>. <source>Bioinformatics</source> <volume>33</volume>, <fpage>2930</fpage>&#x2013;<lpage>2932</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btx315</pub-id>
</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jiang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Harigaya</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Zang</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>N. R.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Nonparametric single-cell multiomic characterization of trio relationships between transcription factors, target genes, and cis-regulatory regions</article-title>. <source>Cell Syst.</source> <volume>13</volume>, <fpage>737</fpage>&#x2013;<lpage>751.e4</lpage>. <pub-id pub-id-type="doi">10.1016/j.cels.2022.08.004</pub-id>
</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kettenring</surname>
<given-names>J. R.</given-names>
</name>
</person-group> (<year>1971</year>). <article-title>Canonical analysis of several sets of variables</article-title>. <source>Biometrika</source> <volume>58</volume>, <fpage>433</fpage>&#x2013;<lpage>451</lpage>. <pub-id pub-id-type="doi">10.1093/biomet/58.3.433</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kiselev</surname>
<given-names>V. Y.</given-names>
</name>
<name>
<surname>Kirschner</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Schaub</surname>
<given-names>M. T.</given-names>
</name>
<name>
<surname>Andrews</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Yiu</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Chandra</surname>
<given-names>T.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>SC3: Consensus clustering of single-cell RNA-seq data</article-title>. <source>Nat. Methods</source> <volume>14</volume>, <fpage>483</fpage>&#x2013;<lpage>486</lpage>. <pub-id pub-id-type="doi">10.1038/nmeth.4236</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Korsunsky</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Millard</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Fan</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Slowikowski</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Wei</surname>
<given-names>K.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Fast, sensitive and accurate integration of single-cell data with Harmony</article-title>. <source>Nat. Methods</source> <volume>16</volume>, <fpage>1289</fpage>&#x2013;<lpage>1296</lpage>. <pub-id pub-id-type="doi">10.1038/s41592-019-0619-0</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Kuppe</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Ziegler</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Cheng</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Kabgani</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Menzel</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Chromatin-accessibility estimation from single-cell ATAC-seq data with scOpen</article-title>. <source>Nat. Commun.</source> <volume>12</volume>, <fpage>6386</fpage>. <pub-id pub-id-type="doi">10.1038/s41467-021-26530-2</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lieberman-Aiden</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>van Berkum</surname>
<given-names>N. L.</given-names>
</name>
<name>
<surname>Williams</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Imakaev</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Ragoczy</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Telling</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2009</year>). <article-title>Comprehensive mapping of long-range interactions reveals folding principles of the human genome</article-title>. <source>Science</source> <volume>326</volume>, <fpage>289</fpage>&#x2013;<lpage>293</lpage>. <pub-id pub-id-type="doi">10.1126/science.1181369</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Singh</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Vert</surname>
<given-names>J. P.</given-names>
</name>
<name>
<surname>Noble</surname>
<given-names>W. S.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Jointly embedding multiple single-cell omics measurements</article-title>. <source>Algorithms Bioinform</source> <volume>143</volume>, <fpage>10</fpage>. <pub-id pub-id-type="doi">10.4230/LIPIcs.WABI.2019.10</pub-id>
</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lock</surname>
<given-names>E. F.</given-names>
</name>
<name>
<surname>Hoadley</surname>
<given-names>K. A.</given-names>
</name>
<name>
<surname>Marron</surname>
<given-names>J. S.</given-names>
</name>
<name>
<surname>Nobel</surname>
<given-names>A. B.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Joint and individual variation explained (JIVE) for integrated analysis of multiple data types</article-title>. <source>Ann. Appl. statistics</source> <volume>7</volume>, <fpage>523</fpage>&#x2013;<lpage>542</lpage>. <pub-id pub-id-type="doi">10.1214/12-AOAS597</pub-id>
</citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ma</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>LaFave</surname>
<given-names>L. M.</given-names>
</name>
<name>
<surname>Earl</surname>
<given-names>A. S.</given-names>
</name>
<name>
<surname>Chiang</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Hu</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Chromatin potential identified by shared single-cell profiling of RNA and chromatin</article-title>. <source>Cell</source> <volume>183</volume>, <fpage>1103</fpage>&#x2013;<lpage>1116.e20</lpage>. <pub-id pub-id-type="doi">10.1016/j.cell.2020.09.056</pub-id>
</citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Meng</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Basunia</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Peters</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Gholami</surname>
<given-names>A. M.</given-names>
</name>
<name>
<surname>Kuster</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Culhane</surname>
<given-names>A. C.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Mogsa: Integrative single sample gene-set analysis of multiple omics data</article-title>. <source>Mol. Cell Proteomics</source> <volume>18</volume>, <fpage>S153</fpage>&#x2013;<lpage>S168</lpage>. <pub-id pub-id-type="doi">10.1074/mcp.TIR118.001251</pub-id>
</citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pliner</surname>
<given-names>H. A.</given-names>
</name>
<name>
<surname>Packer</surname>
<given-names>J. S.</given-names>
</name>
<name>
<surname>McFaline-Figueroa</surname>
<given-names>J. L.</given-names>
</name>
<name>
<surname>Cusanovich</surname>
<given-names>D. A.</given-names>
</name>
<name>
<surname>Daza</surname>
<given-names>R. M.</given-names>
</name>
<name>
<surname>Aghamirzaie</surname>
<given-names>D.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Cicero predicts cis-regulatory DNA interactions from single-cell chromatin accessibility data</article-title>. <source>Mol. Cell</source> <volume>71</volume>, <fpage>858</fpage>&#x2013;<lpage>871.e8</lpage>. <pub-id pub-id-type="doi">10.1016/j.molcel.2018.06.044</pub-id>
</citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pott</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Lieb</surname>
<given-names>J. D.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>What are super-enhancers?</article-title> <source>Nat. Genet.</source> <volume>47</volume>, <fpage>8</fpage>&#x2013;<lpage>12</lpage>. <pub-id pub-id-type="doi">10.1038/ng.3167</pub-id>
</citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rao</surname>
<given-names>S. S.</given-names>
</name>
<name>
<surname>Huntley</surname>
<given-names>M. H.</given-names>
</name>
<name>
<surname>Durand</surname>
<given-names>N. C.</given-names>
</name>
<name>
<surname>Stamenova</surname>
<given-names>E. K.</given-names>
</name>
<name>
<surname>Bochkov</surname>
<given-names>I. D.</given-names>
</name>
<name>
<surname>Robinson</surname>
<given-names>J. T.</given-names>
</name>
<etal/>
</person-group> (<year>2014</year>). <article-title>A 3D map of the human genome at kilobase resolution reveals principles of chromatin looping</article-title>. <source>Cell</source> <volume>159</volume>, <fpage>1665</fpage>&#x2013;<lpage>1680</lpage>. <pub-id pub-id-type="doi">10.1016/j.cell.2014.11.021</pub-id>
</citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Romano</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Vinh</surname>
<given-names>N. X.</given-names>
</name>
<name>
<surname>Bailey</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Verspoor</surname>
<given-names>K.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Adjusting for chance clustering comparison measures</article-title>. <source>J. Mach. Learn. Res.</source> <volume>17</volume>, <fpage>4635</fpage>&#x2013;<lpage>4666</lpage>.</citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Satija</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Farrell</surname>
<given-names>J. A.</given-names>
</name>
<name>
<surname>Gennert</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Schier</surname>
<given-names>A. F.</given-names>
</name>
<name>
<surname>Regev</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Spatial reconstruction of single-cell gene expression data</article-title>. <source>Nat. Biotechnol.</source> <volume>33</volume>, <fpage>495</fpage>&#x2013;<lpage>502</lpage>. <pub-id pub-id-type="doi">10.1038/nbt.3192</pub-id>
</citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Satpathy</surname>
<given-names>A. T.</given-names>
</name>
<name>
<surname>Granja</surname>
<given-names>J. M.</given-names>
</name>
<name>
<surname>Yost</surname>
<given-names>K. E.</given-names>
</name>
<name>
<surname>Qi</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Meschi</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>McDermott</surname>
<given-names>G. P.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Massively parallel single-cell chromatin landscapes of human immune cell development and intratumoral T cell exhaustion</article-title>. <source>Nat. Biotechnol.</source> <volume>37</volume>, <fpage>925</fpage>&#x2013;<lpage>936</lpage>. <pub-id pub-id-type="doi">10.1038/s41587-019-0206-z</pub-id>
</citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Schep</surname>
<given-names>A. N.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Buenrostro</surname>
<given-names>J. D.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Greenleaf WJ: chromVAR: Inferring transcription-factor-associated accessibility from single-cell epigenomic data</article-title>. <source>Nat. Methods</source> <volume>14</volume>, <fpage>975</fpage>&#x2013;<lpage>978</lpage>. <pub-id pub-id-type="doi">10.1038/nmeth.4401</pub-id>
</citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shlyueva</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Stampfel</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Stark</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Transcriptional enhancers: From properties to genome-wide predictions</article-title>. <source>Nat. Rev. Genet.</source> <volume>15</volume>, <fpage>272</fpage>&#x2013;<lpage>286</lpage>. <pub-id pub-id-type="doi">10.1038/nrg3682</pub-id>
</citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shu</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Zhu</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>D-CCA: A decomposition-based canonical correlation analysis for high-dimensional datasets</article-title>. <source>J. Am. Stat. Assoc.</source> <volume>115</volume>, <fpage>292</fpage>&#x2013;<lpage>306</lpage>. <pub-id pub-id-type="doi">10.1080/01621459.2018.1543599</pub-id>
</citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Street</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Risso</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Fletcher</surname>
<given-names>R. B.</given-names>
</name>
<name>
<surname>Das</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Ngai</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Yosef</surname>
<given-names>N.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Slingshot: Cell lineage and pseudotime inference for single-cell transcriptomics</article-title>. <source>BMC Genomics</source> <volume>19</volume>, <fpage>477</fpage>. <pub-id pub-id-type="doi">10.1186/s12864-018-4772-0</pub-id>
</citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Stuart</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Butler</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Hoffman</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Hafemeister</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Papalexi</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Mauck</surname>
<given-names>W. M.</given-names>
<suffix>3rd</suffix>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Comprehensive integration of single-cell data</article-title>. <source>Cell</source> <volume>177</volume>, <fpage>1888</fpage>&#x2013;<lpage>1902.e21</lpage>. <pub-id pub-id-type="doi">10.1016/j.cell.2019.05.031</pub-id>
</citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Stuart</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Srivastava</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Madad</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Lareau</surname>
<given-names>C. A.</given-names>
</name>
<name>
<surname>Satija</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Single-cell chromatin state analysis with Signac</article-title>. <source>Nat. Methods</source> <volume>18</volume>, <fpage>1333</fpage>&#x2013;<lpage>1341</lpage>. <pub-id pub-id-type="doi">10.1038/s41592-021-01282-5</pub-id>
</citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Traag</surname>
<given-names>V. A.</given-names>
</name>
<name>
<surname>Waltman</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>van Eck</surname>
<given-names>N. J.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>From Louvain to leiden: Guaranteeing well-connected communities</article-title>. <source>Sci. Rep.</source> <volume>9</volume>, <fpage>5233</fpage>. <pub-id pub-id-type="doi">10.1038/s41598-019-41695-z</pub-id>
</citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Urrutia</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Jiang</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Destin: Toolkit for single-cell analysis of chromatin accessibility</article-title>. <source>Bioinformatics</source> <volume>35</volume>, <fpage>3818</fpage>&#x2013;<lpage>3820</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btz141</pub-id>
</citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Wan</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Han</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Integrative analyses of single-cell transcriptome and regulome using MAESTRO</article-title>. <source>Genome Biol.</source> <volume>21</volume>, <fpage>198</fpage>. <pub-id pub-id-type="doi">10.1186/s13059-020-02116-x</pub-id>
</citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Welch</surname>
<given-names>J. D.</given-names>
</name>
<name>
<surname>Kozareva</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Ferreira</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Vanderburg</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Martin</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Macosko</surname>
<given-names>E. Z.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Single-cell multi-omic integration compares and contrasts features of brain cell identity</article-title>. <source>Cell</source> <volume>177</volume>, <fpage>1873</fpage>&#x2013;<lpage>1887.e17</lpage>. <pub-id pub-id-type="doi">10.1016/j.cell.2019.05.006</pub-id>
</citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Westerhuis</surname>
<given-names>J. A.</given-names>
</name>
<name>
<surname>Kourti</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>MacGregor</surname>
<given-names>J. F.</given-names>
</name>
</person-group> (<year>1998</year>). <article-title>Analysis of multiblock and hierarchical PCA and PLS models</article-title>. <source>J. Chemom. A J. Chemom. Soc.</source> <volume>12</volume>, <fpage>301</fpage>&#x2013;<lpage>321</lpage>. <pub-id pub-id-type="doi">10.1002/(sici)1099-128x(199809/10)12:5&#x3c;301:aid-cem515&#x3e;3.0.co;2-s</pub-id>
</citation>
</ref>
<ref id="B46">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Witten</surname>
<given-names>D. M.</given-names>
</name>
<name>
<surname>Tibshirani</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Hastie</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>A penalized matrix decomposition, with applications to sparse principal components and canonical correlation analysis</article-title>. <source>Biostatistics</source> <volume>10</volume>, <fpage>515</fpage>&#x2013;<lpage>534</lpage>. <pub-id pub-id-type="doi">10.1093/biostatistics/kxp008</pub-id>
</citation>
</ref>
<ref id="B47">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zappia</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Oshlack</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Clustering trees: A visualization for evaluating clusterings at multiple resolutions</article-title>. <source>Gigascience</source> <volume>7</volume>, <fpage>giy083</fpage>. <pub-id pub-id-type="doi">10.1093/gigascience/giy083</pub-id>
</citation>
</ref>
<ref id="B48">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Meyer</surname>
<given-names>C. A.</given-names>
</name>
<name>
<surname>Eeckhoute</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Johnson</surname>
<given-names>D. S.</given-names>
</name>
<name>
<surname>Bernstein</surname>
<given-names>B. E.</given-names>
</name>
<etal/>
</person-group> (<year>2008</year>). <article-title>Model-based analysis of ChIP-seq (MACS)</article-title>. <source>Genome Biol.</source> <volume>9</volume>, <fpage>R137</fpage>. <pub-id pub-id-type="doi">10.1186/gb-2008-9-9-r137</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>