<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Genet.</journal-id>
<journal-title>Frontiers in Genetics</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Genet.</abbrev-journal-title>
<issn pub-type="epub">1664-8021</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fgene.2021.665888</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Genetics</subject>
<subj-group>
<subject>Methods</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>A Scalable Strand-Specific Protocol Enabling Full-Length Total RNA Sequencing From Single Cells</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name><surname>Haile</surname> <given-names>Simon</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Corbett</surname> <given-names>Richard D.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1107482/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>LeBlanc</surname> <given-names>Veronique G.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Wei</surname> <given-names>Lisa</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1227989/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Pleasance</surname> <given-names>Stephen</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Bilobram</surname> <given-names>Steve</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Nip</surname> <given-names>Ka Ming</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Brown</surname> <given-names>Kirstin</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Trinh</surname> <given-names>Eva</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Smith</surname> <given-names>Jillian</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Trinh</surname> <given-names>Diane L.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Bala</surname> <given-names>Miruna</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Chuah</surname> <given-names>Eric</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Coope</surname> <given-names>Robin J. N.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Moore</surname> <given-names>Richard A.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Mungall</surname> <given-names>Andrew J.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/529645/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Mungall</surname> <given-names>Karen L.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Zhao</surname> <given-names>Yongjun</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Hirst</surname> <given-names>Martin</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Aparicio</surname> <given-names>Samuel</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Birol</surname> <given-names>Inanc</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Jones</surname> <given-names>Steven J. M.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Marra</surname> <given-names>Marco A.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1224821/overview"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>Canada&#x2019;s Michael Smith Genome Sciences Centre, BC Cancer</institution>, <addr-line>Vancouver, BC</addr-line>, <country>Canada</country></aff>
<aff id="aff2"><sup>2</sup><institution>Department of Molecular Oncology, BC Cancer</institution>, <addr-line>Vancouver, BC</addr-line>, <country>Canada</country></aff>
<aff id="aff3"><sup>3</sup><institution>Department of Medical Genetics, University of British Columbia</institution>, <addr-line>Vancouver, BC</addr-line>, <country>Canada</country></aff>
<author-notes>
<fn fn-type="edited-by"><p>Edited by: Eva Beate H&#x00F6;rmanseder, Helmholtz Zentrum M&#x00FC;nchen, Helmholtz-Gemeinschaft Deutscher Forschungszentren (HZ), Germany</p></fn>
<fn fn-type="edited-by"><p>Reviewed by: Rui Chen, Baylor College of Medicine, United States; Antonio Scialdone, Helmholtz Zentrum M&#x00FC;nchen, Helmholtz-Gemeinschaft Deutscher Forschungszentren (HZ), Germany</p></fn>
<corresp id="c001">&#x002A;Correspondence: Marco A. Marra, <email>mmarra@bcgsc.ca</email></corresp>
<fn fn-type="other" id="fn004"><p>This article was submitted to Genomic Assay Technology, a section of the journal Frontiers in Genetics</p></fn>
</author-notes>
<pub-date pub-type="epub">
<day>03</day>
<month>06</month>
<year>2021</year>
</pub-date>
<pub-date pub-type="collection">
<year>2021</year>
</pub-date>
<volume>12</volume>
<elocation-id>665888</elocation-id>
<history>
<date date-type="received">
<day>09</day>
<month>02</month>
<year>2021</year>
</date>
<date date-type="accepted">
<day>21</day>
<month>04</month>
<year>2021</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2021 Haile, Corbett, LeBlanc, Wei, Pleasance, Bilobram, Nip, Brown, Trinh, Smith, Trinh, Bala, Chuah, Coope, Moore, Mungall, Mungall, Zhao, Hirst, Aparicio, Birol, Jones and Marra.</copyright-statement>
<copyright-year>2021</copyright-year>
<copyright-holder>Haile, Corbett, LeBlanc, Wei, Pleasance, Bilobram, Nip, Brown, Trinh, Smith, Trinh, Bala, Chuah, Coope, Moore, Mungall, Mungall, Zhao, Hirst, Aparicio, Birol, Jones and Marra</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<abstract>
<p>RNA sequencing (RNAseq) has been widely used to generate bulk gene expression measurements collected from pools of cells. Only relatively recently have single-cell RNAseq (scRNAseq) methods provided opportunities for gene expression analyses at the single-cell level, allowing researchers to study heterogeneous mixtures of cells at unprecedented resolution. Tumors tend to be composed of heterogeneous cellular mixtures and are frequently the subjects of such analyses. Extensive method developments have led to several protocols for scRNAseq but, owing to the small amounts of RNA in single cells, technical constraints have required compromises. For example, the majority of scRNAseq methods are limited to sequencing only the 3&#x2032; or 5&#x2032; termini of transcripts. Other protocols that facilitate full-length transcript profiling tend to capture only polyadenylated mRNAs and are generally limited to processing only 96 cells at a time. Here, we address these limitations and present a novel protocol that allows for the high-throughput sequencing of full-length, total RNA at single-cell resolution. We demonstrate that our method produced strand-specific sequencing data for both polyadenylated and non-polyadenylated transcripts, enabled the profiling of transcript regions beyond only transcript termini, and yielded data rich enough to allow identification of cell types from heterogeneous biological samples.</p>
</abstract>
<kwd-group>
<kwd>full-length</kwd>
<kwd>total RNA</kwd>
<kwd>single-cell</kwd>
<kwd>RNAseq</kwd>
<kwd>cellenONE</kwd>
</kwd-group>
<contract-sponsor id="cn001">Canadian Cancer Society<named-content content-type="fundref-id">10.13039/501100000521</named-content></contract-sponsor><contract-sponsor id="cn002">Canadian Institutes of Health Research<named-content content-type="fundref-id">10.13039/501100000024</named-content></contract-sponsor><contract-sponsor id="cn003">Genome Canada<named-content content-type="fundref-id">10.13039/100008762</named-content></contract-sponsor><contract-sponsor id="cn004">Genome British Columbia<named-content content-type="fundref-id">10.13039/501100000233</named-content></contract-sponsor>
<counts>
<fig-count count="7"/>
<table-count count="0"/>
<equation-count count="0"/>
<ref-count count="57"/>
<page-count count="16"/>
<word-count count="0"/>
</counts>
</article-meta>
</front>
<body>
<sec id="S1">
<title>Introduction</title>
<p>Bulk RNA sequencing (RNAseq) is commonly used to study the average gene expression of cells within a population. The relatively recent introduction of single-cell RNAseq (scRNAseq) has provided insights into cell-level heterogeneity in biological samples in developing tissues (e.g., <xref ref-type="bibr" rid="B45">Scialdone et al., 2016</xref>) and tumors (e.g., <xref ref-type="bibr" rid="B51">Tirosh et al., 2016</xref>) at unprecedented resolution. It has become clear that to accurately assess the spatial and temporal patterns of gene expression in healthy and diseased cells, the profiling of samples at a single-cell resolution is vital.</p>
<p>The first step of scRNAseq is the isolation of individual cells, where capture efficiency remains a significant challenge. Several existing approaches include flow cytometry, limiting dilution, laser capture microdissection, and microfluidic techniques (<xref ref-type="bibr" rid="B27">Kolodziejczyk et al., 2015</xref>; <xref ref-type="bibr" rid="B56">Ziegenhain et al., 2017</xref>). Others involve the trapping of single cells within droplets followed by on-bead or in-droplet molecular barcoding of cells (<xref ref-type="bibr" rid="B27">Kolodziejczyk et al., 2015</xref>; <xref ref-type="bibr" rid="B56">Ziegenhain et al., 2017</xref>). Approaches differ in their cost, efficiency, starting material type and number of cells required while low capture efficiencies and cell size restrictions of microfluidic approaches remain a challenge (<xref ref-type="bibr" rid="B27">Kolodziejczyk et al., 2015</xref>; <xref ref-type="bibr" rid="B56">Ziegenhain et al., 2017</xref>; <xref ref-type="bibr" rid="B8">Cao et al., 2017</xref>, <xref ref-type="bibr" rid="B9">2019</xref>). To address some of these shortcomings, <xref ref-type="bibr" rid="B8">Cao et al. (2017)</xref> developed a combinatorial cell indexing approach uniquely free of both single cell isolation and compartmentalization techniques (<xref ref-type="bibr" rid="B8">Cao et al., 2017</xref>, <xref ref-type="bibr" rid="B9">2019</xref>).</p>
<p>Regardless of the method used for single cell isolation, scRNAseq protocols are further limited by the amount of RNA in single cells. Since the first scRNAseq method was published by <xref ref-type="bibr" rid="B49">Tang et al. (2009)</xref>, several approaches have been developed to improve RNA capture efficiency. Even so, scRNAseq protocols are generally limited to capturing only the 3&#x2032; or 5&#x2032; ends of transcripts (<xref ref-type="bibr" rid="B27">Kolodziejczyk et al., 2015</xref>) and therefore remain best suited for transcript counting, but not for examining transcript structures such as splice variants and fusion transcripts, as are often found in cancers. Furthermore, protocols tend to capture only polyadenylated (polyA<sup>+</sup>) transcripts and therefore exclude non-polyadenylated (polyA<sup>&#x2013;</sup>) transcripts, including some non-coding RNAs. Finally, commonly used scRNAseq protocols do not provide strand-orientation information. Discriminating sense and antisense overlapping transcripts has been important in studies of antisense expression (e.g., <xref ref-type="bibr" rid="B3">Balbin et al., 2015</xref>).</p>
<p>The SMART-seq protocol, which employs the Fluidigm C1 System (<xref ref-type="bibr" rid="B15">Durruthy-Durruthy and Ray, 2018</xref>), yields data appropriate for full-length transcript analyses but only for polyA<sup>+</sup> mRNAs. Recently, <xref ref-type="bibr" rid="B23">Hayashi et al. (2018)</xref> reported a scRNAseq protocol that also employed the Fluidigm C1 System, but as it only allowed for processing of up to 96 cells per run, sensitivity to minor cell populations is low (<xref ref-type="bibr" rid="B23">Hayashi et al., 2018</xref>), thus constraining the technique to samples with limited heterogeneity. Moreover, both protocols are strand-agnostic, which is known to lead to inaccurate transcript quantification and does not readily allow for studies of anti-sense RNA biology (<xref ref-type="bibr" rid="B35">Mills et al., 2013</xref>; <xref ref-type="bibr" rid="B46">Sigurgeirsson et al., 2014</xref>; <xref ref-type="bibr" rid="B55">Zhao et al., 2015</xref>).</p>
<p>To better profile gene expression at single-cell resolution, a high-throughput, strand-specific protocol with minimal 3&#x2032; or 5&#x2032; bias that extends sequence results beyond polyA<sup>+</sup> RNA is needed. Here, we report a method that addresses the aforementioned limitations, and demonstrate its capacity to process over 1,000 cells per run. This protocol enables full-length, strand-specific sequencing of total RNA at single-cell resolution, providing researchers with an avenue for a more complete analysis of gene expression in heterogeneous biological samples.</p>
</sec>
<sec id="S2" sec-type="materials|methods">
<title>Materials and Methods</title>
<sec id="S2.SS1">
<title>Cell Line and RNA Samples</title>
<p>Universal Human Reference (UHR) total RNA was obtained from Stratagene (Cat. No. 740000) and quantified using the Agilent RNA 6000 Nano Kit (Cat. No. 5067-1511). For the input titration experiments shown in <xref ref-type="fig" rid="F1">Figure 1</xref>, UHR was spiked with External RNA Controls Consortium (ERCC) spike-in mix 1 from Ambion (Cat. No. 4456740) where 0.02 &#x03BC;L of the spike-in mix (&#x223C;1.035 moles) was used per 1 &#x03BC;g UHR total RNA. For the single-cell experiments, an equivalent of 1 &#x03BC;L of one million-fold dilution of the ERCC mix 1 stock (&#x223C;0.1 attomoles) was used per well. The immortalized Normal Human Astrocyte (NHA) cell line (<xref ref-type="bibr" rid="B47">Sonoda et al., 2001</xref>) was obtained from Applied Biological Materials (ABM) Inc (T3022; Richmond, BC, Canada) while the Human Peripheral Blood Mononuclear Cells (PBMCs) were purchased from STEMCELL Technologies (Cat. No. 70025.1).</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption><p>DLP-scRNAseq workflow. Following single-cell isolation using the cellenONE automated cell spotter and lysis, RNA was fragmented using magnesium ion-dependent heating. Adapters containing 5&#x2032;- and 3&#x2032;-end sequencing primer targets were introduced sequentially as part of the cDNA synthesis steps, thereby achieving strand-specificity. Cell-specific barcodes were introduced in the first round of PCR (Index PCR). All steps up to Index PCR were performed in nanoliter-scale wells (Nanoliter platform). PCR products were then pooled and subsequent steps including rRNA depletion were performed in 96-well plate format (Microliter platform). Figure was created using <ext-link ext-link-type="uri" xlink:href="https://biorender.com">biorender.com</ext-link>.</p></caption>
<graphic xlink:href="fgene-12-665888-g001.tif"/>
</fig>
</sec>
<sec id="S2.SS2">
<title>Sample Preparation for RNAseq</title>
<sec id="S2.SS2.SSS1">
<title>Standard and Modified RNaseH rRNA Depletion</title>
<p>Standard RNaseH rRNA depletion was applied to 1&#x2013;10 ng of total RNA as described previously (<xref ref-type="bibr" rid="B21">Haile et al., 2017a</xref>, <xref ref-type="bibr" rid="B20">2019</xref>) except that half of the rRNA probe amount was used. Upstream DNase I treatment was omitted as the probe removal DNase treatment step that is integrated into the rRNA depletion kit was found to be sufficient for removing residual gDNA contamination.</p>
<p>For modified RNase H-based rRNA depletion, unpurified RNA following rRNA depletion was incubated at 95&#x00B0;C for 10 min without EDTA to heat-inactivate the DNase and to fragment the RNA in a Mg<sup>2+</sup>-dependent manner (Mg<sup>2+</sup> is part of DNase reaction buffer as a cofactor for the enzyme). The amount of rRNA probe used was half of the standard amount for 1&#x2013;10 ng total RNA and fivefold less than the standard amount for &#x003C; 1 ng total RNA. Following the rRNA depletion, DNase I treatment, and RNA fragmentation steps, first-strand cDNA synthesis was performed directly without purification to remove contaminants from upstream reactions. The first-strand buffer amount was adjusted to account for the buffers in the upstream reactions and was spiked with DTT to a final concentration of 2.5 mM as is standard for first strand cDNA synthesis. cDNA synthesis and library construction steps were performed as described previously (<xref ref-type="bibr" rid="B20">Haile et al., 2019</xref>). PCR was performed using 15 and 18 cycles for 1&#x2013;10 ng and 0.1&#x2013;0.25 ng total RNA input, respectively.</p>
</sec>
<sec id="S2.SS2.SSS2">
<title>SMART-Seq_v4</title>
<p>SMART-Seq v4 Ultra Low input RNA for sequencing (Cat. No. 634888; Takara Bio Inc) was used according to the manufacturer&#x2019;s recommendations. PCR was done using 14 cycles for 0&#x2013;250 pg total RNA input, 10 cycles for 1 ng, and 7 cycles for 5&#x2013;10 ng. Following purification of the PCR reactions, 150 pg of amplified cDNA was used for library construction using the Nextera XT DNA Library Preparation Kit (Cat. No. FC-131-1024; Illumina) as per the manufacturer&#x2019;s recommendations.</p>
</sec>
<sec id="S2.SS2.SSS3">
<title>PolyA-Based RNAseq and Exome RNAseq</title>
<p>PolyA-based libraries were constructed as described previously (17). For exome RNAseq, total RNA was directly used for cDNA synthesis and library construction steps as described previously (<xref ref-type="bibr" rid="B22">Haile et al., 2017b</xref>). PCR was done using 15 cycles to amplify 0&#x2013;250 pg RNA and 13 cycles to amplify 1&#x2013;10 ng. Following purification of the PCR reactions, 500 ng of amplified libraries were used for exome capture as described previously (<xref ref-type="bibr" rid="B13">Cieslik et al., 2015</xref>).</p>
</sec>
<sec id="S2.SS2.SSS4">
<title>SMARTer Bulk Total RNAseq</title>
<p>SMARTer<sup>&#x00AE;</sup> Stranded Total RNAseq Kit v2&#x2013;Pico Input Mammalian (Cat. No. 634413; Takara Bio Inc.) was used as per the manufacturer&#x2019;s instructions when the starting material was total RNA. PCR was done using 16 cycles of PCR to amplify 0&#x2013;250 pg of RNA, 14 cycles to amplify 1 ng, and 12 cycles to amplify 5&#x2013;10 ng.</p>
<p>For bulk RNAseq, 10&#x2013;500 cells, based on hemocytometer cell counting, were first washed and resuspended in 2 &#x03BC;L of 1&#x00D7; PBS and were mixed with 6 &#x03BC;L of 1&#x00D7; lysis buffer (Cat. No. 635013; Takara Bio Inc) containing 0.5% RNase inhibitor (Cat. No. 635013; Takara Bio Inc). The rest of the steps were performed according to the manufacturer&#x2019;s instructions in the supplementary Pico v2 protocol for intact-cell inputs (Takara Bio Inc). Prior to rRNA depletion, 5 cycles of PCR were used to amplify cDNA fragments. Following rRNA depletion, 18 cycles of PCR were used for 10 cells and 14 cycles for 500 cells.</p>
</sec>
<sec id="S2.SS2.SSS5">
<title>Direct Library Preparation (DLP)-Based Single Cell Total RNAseq (DLP-scRNAseq)</title>
<p>Cell spotting was performed using the cellenONE (Cellenion) platform as previously described for the Direct Library Preparation Plus (DLP+) single-cell genome sequencing protocol (<xref ref-type="bibr" rid="B28">Laks et al., 2019</xref>). For single cells, the upstream RNAseq preparation steps including cell lysis, RNA fragmentation, cDNA synthesis and adapter addition were performed as described above for the SMARTer bulk protocol, but generally with volumes in nanoliters as opposed to microliters. The step-by-step details of the protocol are attached in <xref ref-type="supplementary-material" rid="S8">Supplementary Text File</xref> (pages 5&#x2013;29). For optimal spotting of reaction mixes other than the lysis/fragmentation mix, 0.05% Tween-20 was spiked into the reactions. Reaction mixes and primers were filtered using spin-x columns (Cat. No. CLS8162; Merck) whenever spotting proved to be problematic. All steps up to and including the introduction of cell-specific indices during the first round of PCR (pre-rRNA depletion), were performed in nanoliter volumes using Takara Smart Chips (Takara Bio Inc). These arrays consist of a 72 &#x00D7; 72 (5184) well layout, each of which is able to hold a volume of approximately 100 nl. After 5 cycles of the first round of PCR, the chip was inverted and spun down to pool all reactions into one tube. Subsequent steps were performed according to the SMARTer Stranded Total RNAseq Kit v2&#x2013;Pico Input Mammalian manufacturer&#x2019;s instructions.</p>
<p>The SMARTer<sup>&#x00AE;</sup> kit comes with indexing primers that allow the barcoding of a maximum of 96 samples. To increase the number of cells that could be processed, we designed our own barcodes based on the following requirements: (1) the random primer and strand-switching oligos were to be anchored to Illumina sequencing primer sequences, and (2) primers used for the first round of PCR must have complementary sequences to the Illumina sequencing primer anchors internally, followed by indices in the middle, and P5/P7 priming sites at their distal ends. We thus designed 72 &#x00D7; 72 dual indexing primers enabling 5184 unique cell-specific barcodes (<xref ref-type="supplementary-material" rid="S8">Supplementary Table 1</xref>).</p>
</sec>
</sec>
<sec id="S2.SS3">
<title>Sequencing and Bioinformatic Analysis</title>
<p>We generated the following libraries using the DLP-scRNAseq: 402 single NHA cells with the same indexing primers, 92 single NHA cells with unique cell-specific primers, and triplicates of no-cell negative controls and positive control 5 pg UHR total RNA. These libraries were pooled into one tube, which we referred to as the nano-pool. We also prepared the following libraries in the microliter platform: 10 NHA cells in bulk, 500 NHA cells in bulk as well as a single replicate of 4 ng total UHR.</p>
<p>The DLP-scRNAseq NHA pool (0.5&#x00D7;), the bulk SMARTer NHA 500 cells (0.2&#x00D7;), the bulk NHA 10 cells (0.2&#x00D7;), and the bulk UHR (0.1&#x00D7;) were pooled and sequenced on one lane of an Illumina HiSeq 2500 flowcell (paired end 75 bp).</p>
<sec id="S2.SS3.SSS1">
<title>JAGuaR Alignment</title>
<p>Sequence analysis was performed as described previously (<xref ref-type="bibr" rid="B21">Haile et al., 2017a</xref>, <xref ref-type="bibr" rid="B22">b</xref>, <xref ref-type="bibr" rid="B20">2019</xref>), and briefly involved alignment of reads to the hg19 reference genome in combination with Ensembl 69 gene models using the JAGuaR junction-aware alignment pipeline (<xref ref-type="bibr" rid="B7">Butterfield et al., 2014</xref>) using the &#x201C;mem&#x201D; alignment option in place of &#x201C;aln.&#x201D; Gene expression values were calculated exactly as described in <xref ref-type="bibr" rid="B21">Haile et al. (2017a</xref>, <xref ref-type="bibr" rid="B22">b</xref>, <xref ref-type="bibr" rid="B20">2019)</xref>. Briefly, the read chastity status was first marked with custom scripts and duplicates were marked with Sambamba 0.5.5 (<xref ref-type="bibr" rid="B50">Tarasov et al., 2015</xref>). Reads were then split into positive- and negative-strand BAM files, analyzed for depth of reads after converting to wig files, and finally reads per kilobase per million (RPKM) values were generated from these counts.</p>
<p>When comparing results for non-single-cell libraries, we control for depth-related variables by down-sampling the original BAM files to obtain approximately equal numbers of reads for each library. Down-sampled read alignments were subsequently enumerated to generate an expression matrix of sample-by-gene RPKM estimates that were then used in correlation analyses to evaluate the similarities in expression profiles across samples and protocols.</p>
<p>Sequencing data are deposited at the Sequence Read Archive (SRP286135).</p>
</sec>
<sec id="S2.SS3.SSS2">
<title>STAR Alignments</title>
<p>RNA read alignments were performed with STAR 2.7.3a (<xref ref-type="bibr" rid="B14">Dobin et al., 2013</xref>) in 2-pass mode after detecting adapter sequence using bbmerge (<xref ref-type="bibr" rid="B6">Bushnell et al., 2017</xref>) and trimming with cutadapt version 1.16 (<xref ref-type="bibr" rid="B11">Chen et al., 2018</xref>). TPM expression estimates were generated from the STAR alignments using Stringtie (<xref ref-type="bibr" rid="B39">Pertea et al., 2015</xref>).</p>
</sec>
<sec id="S2.SS3.SSS3">
<title>Comparison With qPCR Data</title>
<p>UHR qPCR data from the MicroArray Quality Control project (GSE5350) (<xref ref-type="bibr" rid="B33">MAQC Consortium et al., 2006</xref>) were downloaded for comparison to our expression results. Using samples GSM129638-GSM129641, expression estimates were matched by gene name between our RPKM values and the published qPCR estimates. Each sample was correlated with all four replicate qPCR data sets, from which a median Pearson correlation was calculated.</p>
</sec>
<sec id="S2.SS3.SSS4">
<title>Exon-Level Analysis</title>
<p>For exon analysis, BAM files were generated from aligning reads (read 1&#x0026;2 lengths of 69 bp for single-cell libraries and read 1&#x0026;2 lengths of 75 bp for bulk libraries) using JAGuaR as described above.</p>
<p>Exon quantification was performed for full exons as well as partial exons that fell within the 3&#x2032; and 5&#x2032; untranslated regions (UTRs) of annotated transcripts. Partial exon means only part of an exon falls within either the 3&#x2032; or 5&#x2032; UTR of a transcript. The analysis was performed using the following R packages: <italic>GenomicFeatures</italic> (v1.26.4), <italic>GenomicRanges</italic> (v1.26.4), <italic>Rsamtools</italic> (v1.26.2), <italic>IRanges</italic> (2.8.2), and <italic>GenomicAlignments</italic> (v1.10.1). All exon start and end locations and their associated transcript and gene IDs were retrieved from the Ensembl databases using the functions <italic>makeTxDbFromUCSC</italic> and <italic>exons</italic> from <italic>GenomicFeatures</italic>. The functions <italic>fiveUTRsByTranscript</italic> and <italic>threeUTRsByTranscript</italic> from <italic>GenomicFeatures</italic> were used to extract the start and end coordinates of full or partial exons that constituted the 3&#x2032;UTR or 5&#x2032;UTR regions of each transcript.</p>
<p>Non-duplicate paired-end reads were imported from the BAM files using <italic>readGAlignmentPairs</italic> from <italic>GenomicAlignments</italic>. A second filtering step was applied to keep only reads that aligned to genomic locations that did not fall exclusively within 100 bp of the start and end of each chromosome. The second filtering step was applied to avoid the confounding effects of telomeric repeats on read mapping. The number of reads that overlapped with each exon, or each exonic region within the 3&#x2032;UTR or 5&#x2032;UTR of transcripts, was quantified using the <italic>countOverlaps</italic> function from the <italic>IRanges</italic> package. A read could map to multiple exons or exonic regions if its genomic coordinates overlapped with the coordinates of more than one region. For comparisons of expression levels, exon counts were normalized for sequencing depth using <italic>calcNormFactors</italic> and converted to RPKM using the <italic>rpkm</italic> function from <italic>edgeR</italic> v3.24.3.</p>
</sec>
<sec id="S2.SS3.SSS5">
<title>PBMC Clustering Analysis</title>
<p>For the PBMC clustering analysis, the fastq file for the 10X PBMC data was obtained from the 10X website<sup><xref ref-type="fn" rid="footnote1">1</xref></sup>, and the CellRanger pipeline (v3.0.2) was used to obtain a count matrix for 1,223 cells, aligning to hg19 (v3.0.0<sup><xref ref-type="fn" rid="footnote2">2</xref></sup>). Data preprocessing was performed in R, based on the count matrices output by HTSeq (<xref ref-type="bibr" rid="B1">Anders et al., 2015</xref>) using the JAGuaR-based read alignments (DLP-scRNAseq data) or by the CellRanger pipeline (10X data). For the DLP-scRNAseq dataset, counts from all wells identified as containing a cell (<italic>n</italic> = 517) were combined into a single count matrix. Outliers were identified based on total read counts, total number of genes detected, and the percent of counts coming from ERCC spike-ins for DLP-scRNAseq, as previously described (<xref ref-type="bibr" rid="B31">Lun A.T et al., 2016</xref>). For each of these metrics, cells with lower (read counts and genes detected) or higher (percent of counts from ERCCs) than three median absolute deviations from the median were considered outliers (<italic>n</italic> = 56 for the DLP-scRNAseq dataset; <italic>n</italic> = 94 for the 10X dataset). After cell filtering, genes with at least one read count in at least two cells were retained, resulting in final datasets with 461 cells and 16,642 genes (DLP-scRNAseq) and 1,129 cells and 15,982 genes (10X). Normalization was then applied to all cells using the <italic>scran</italic> package (v1.10.1) (<xref ref-type="bibr" rid="B31">Lun A.T et al., 2016</xref>). The <italic>quickCluster</italic> function was used to cluster cells for normalization with min.mean = 0.1 for the DLP-scRNAseq dataset, as suggested for read count data, and 0.01 for the 10X dataset, as suggested for UMI data.
Resulting clusters were used as input to the <italic>computeSpikeFactors</italic> (DLP-scRNAseq, with ERCC reads labeled as spike-ins) or <italic>computeSumFactors</italic> (10X) function. These factors were then used in the <italic>normalize</italic> function of the <italic>scater</italic> R package (v1.10.0) to obtain normalized expression values that were used for downstream analyses.</p>
<p>Cell clustering was performed largely as described previously (<xref ref-type="bibr" rid="B32">Lun A.T.L. et al., 2016</xref>). Highly variable genes (HVGs) were first identified using the <italic>trendVar</italic> function of the <italic>scran</italic> R package with <italic>parametric</italic> set to TRUE, a span of 0.3 for the LOESS fitting, and min.mean set to 0.1 (DLP-scRNAseq) or 0.01 (10X). The <italic>decomposeVar</italic> function was then used to decompose gene-specific variances into biological and technical components, and genes with a biological component &#x003E;0.1 and a Benjamini-Hochberg-corrected <italic>p</italic> &#x003C; 0.05 were considered HVGs. Principal component analysis (PCA) was performed using the <italic>parallelPCA</italic> function on the normalized expression matrix containing only HVGs, and 1,000 permutation iterations were performed to identify significant principal components (PCs). Briefly, this function permutes the expression vector for each gene and repeats the PCA to calculate the fraction of variance explained by each PC (up to 100) under a random null model; all PCs from the first PC where the permuted fractions exceed the observed fraction of variance in more than 10% of iterations (the default threshold) are then discarded, and earlier PCs are retained as &#x201C;significant PCs&#x201D; (with a minimum of five). A shared nearest neighbor graph (<italic>k</italic> = 15) was then obtained using the <italic>buildSNNGraph</italic> function based on the PCA reduction (with six and seven significant PCs for the DLP-scRNAseq and 10X datasets, respectively), and the <italic>cluster_walktrap</italic> function from the <italic>igraph</italic> R package (v1.2.2) was used to identify clusters.</p>
<p>Marker genes with high expression in individual clusters were identified using the <italic>overlapExprs</italic> function from <italic>scran</italic>, which performs Wilcoxon rank-sum tests between each pair of clusters and then calculates a combined <italic>p</italic>-value using Simes&#x2019; method. The tSNE plots used for visualization were obtained using the <italic>Rtsne.multicore</italic> R package (v0.0.99) with perplexity = 50, theta = 0.0, and a maximum of 2,000 iterations, based on the significant PCs described above. The correlation analysis to reference cell types was performed using the <italic>SingleR</italic> (v0.2.0) (<xref ref-type="bibr" rid="B2">Aran et al., 2019</xref>) tool in R with the LM22 matrix (<xref ref-type="bibr" rid="B37">Newman et al., 2015</xref>) as a reference. For this analysis, normalized expression values from the DLP-scRNAseq dataset were further normalized for gene length using the approach described in <xref ref-type="bibr" rid="B43">Reid et al. (2018)</xref>.</p>
</sec>
<sec id="S2.SS3.SSS6">
<title>PBMC Alternative Splicing Analysis</title>
<p>Splicing patterns were first quantified in individual cells using BRIE (<xref ref-type="bibr" rid="B24">Huang and Sanguinetti, 2017</xref>) and the lenient annotations provided by the tool&#x2019;s authors (Gencode v19<sup><xref ref-type="fn" rid="footnote3">3</xref></sup>). Differential splicing was then performed between each pair of cells using default parameters. Events with a Bayes factor &#x2265;10 and a difference in the proportion of spliced isoform (&#x0394;PSI) &#x003E; 0.2 were considered to be differentially spliced (<xref ref-type="bibr" rid="B5">Bray et al., 2016</xref>). For each pair of cell types, the total possible number of events was calculated as follows: # of cells in cell type 1 &#x00D7; # of cells in cell type 2 &#x00D7; # of unique transcripts in the annotation file.</p>
<p>To identify cell type-specific alternative splicing events, we first pooled reads from all cells assigned to the same cell type. BRIE was then used to quantify events in each cell type and perform differential splicing analyses between each pair of cell types using default parameters. Events with a Bayes factor &#x2265;10 were considered to be differentially spliced between cell types (<xref ref-type="bibr" rid="B24">Huang and Sanguinetti, 2017</xref>) and events that were specific to one cell type (i.e., had a higher or lower PSI than all other cell types) were identified (<xref ref-type="supplementary-material" rid="S8">Supplementary Table 3</xref>). Sashimi plots were created using the script provided with the <italic>briekit</italic> tool<sup><xref ref-type="fn" rid="footnote4">4</xref></sup> using default parameters.</p>
</sec>
<sec id="S2.SS3.SSS7">
<title>ERCC Spike-in Analysis</title>
<p>ERCC alignment and sensitivity analysis were performed using seqtk (default parameters)<sup><xref ref-type="fn" rid="footnote5">5</xref></sup> to down-sample the fastq files when matching depths were required. Fastp (<xref ref-type="bibr" rid="B11">Chen et al., 2018</xref>) was used to detect and trim adapters, after which alignment and gene expression quantification were performed with Kallisto (<xref ref-type="bibr" rid="B17">Falcao et al., 2018</xref>). Sensitivity analysis was performed using logistic regression as outlined in <xref ref-type="bibr" rid="B48">Svensson et al. (2017)</xref>. A Nextflow script orchestrating these operations across folders of fastqs is available at <ext-link ext-link-type="uri" xlink:href="https://svn.bcgsc.ca/bitbucket/projects/RCORBETT/repos/single_cell_rna/browse">https://svn.bcgsc.ca/bitbucket/projects/RCORBETT/repos/single_cell_rna/browse</ext-link> where the R scripts used to make related figures can also be found.</p>
</sec>
<sec id="S2.SS3.SSS8">
<title>Enhancer and Circular RNA Analyses</title>
<p>Enhancer RNA analysis was performed as described in <xref ref-type="bibr" rid="B23">Hayashi et al. (2018)</xref> using the JAGuaR alignments as the starting point. Circular RNA detection was performed with CIRIquant (<xref ref-type="bibr" rid="B54">Zhang et al., 2020</xref>) for which a Nextflow script and associated R notebook are available at <ext-link ext-link-type="uri" xlink:href="https://svn.bcgsc.ca/bitbucket/projects/RCORBETT/repos/single_cell_rna/browse">https://svn.bcgsc.ca/bitbucket/projects/RCORBETT/repos/single_cell_rna/browse</ext-link>.</p>
</sec>
</sec>
</sec>
<sec id="S3">
<title>Results and Discussion</title>
<p>Here, we address limitations of current scRNAseq approaches, pursuing two aims: (1) identification and optimization of a strand-specific scRNAseq protocol that offers the potential of full-length transcript analysis of both polyA<sup>+</sup> and polyA<sup>&#x2013;</sup> RNAs on Illumina sequencing instruments, and (2) the potential for automation of such a protocol on a platform that allows for high-throughput processing of various cell types with acceptable recovery of single cells and sequencing data quality.</p>
<sec id="S3.SS1">
<title>Requirements for a Strand-Specific Total RNA scRNAseq Protocol</title>
<p>Random priming of cDNA synthesis was chosen to enable total RNA sequencing, the result of which required both removal of ribosomal RNAs (rRNAs) without loss of cell-specific indexing, and the generation of small sequencing template fragments appropriate for analysis on short-read sequencers. To achieve such fragments, the protocol design incorporated RNA fragmentation. From there, steps leading up to single cell-specific indexing were envisioned as occurring in one reaction vessel, without the need for purifications between protocol steps. The cDNA synthesis step was viewed as the earliest opportunity for cell-specific indexing, and so we preferred the possibility of performing rRNA depletion after cDNA synthesis.</p>
<p>We first conducted a literature search for protocols that met these requirements (<xref ref-type="supplementary-material" rid="S8">Supplementary Figure 1A</xref>), and identified or developed three protocols that met these criteria. The first protocol, hereafter referred to as SMARTer, is based on the SMARTer<sup>&#x00AE;</sup> Stranded Total RNAseq Kit (Takara Bio Inc). In this protocol, rRNA depletion relies on hybridization following the PCR amplification of cDNA fragments. Library construction is not ligation-based, as the introduction of priming sites for Illumina sequencing is integrated into the cDNA synthesis and amplification steps. The second protocol is a variation of an exome RNAseq method that was reported previously for bulk RNAseq (<xref ref-type="bibr" rid="B13">Cieslik et al., 2015</xref>). rRNA depletion is done using exome capture and occurs following PCR amplification of adapter-ligated cDNA fragments. The disadvantage of this protocol is that recovered transcripts were limited by probe sets matching annotated exons: transcripts lacking probe sets could not be recovered.</p>
<p>Previously, we showed that the RNaseH rRNA depletion protocol was optimal for low input RNA (<xref ref-type="bibr" rid="B21">Haile et al., 2017a</xref>, <xref ref-type="bibr" rid="B22">b</xref>, <xref ref-type="bibr" rid="B20">2019</xref>); however, that protocol involved a purification step following rRNA depletion, which occurred prior to cDNA synthesis. We modified this protocol by removing the purification step, thereby providing a third scRNAseq protocol for evaluation (referred to as the Modified RNaseH protocol). We also generated data using the SMART-Seq v4 (SMART_v4) Ultra Low input RNA for sequencing (Takara Bio Inc.), the latest commercial version of the Smart-seq2 protocol that is commonly used for scRNAseq (<xref ref-type="bibr" rid="B40">Picelli et al., 2013</xref>). However, this protocol does not meet the requirements mentioned above since it is strand-agnostic, is restricted to poly-A RNAs and is of smaller scale (maximum of 96 cells). We used these data as &#x201C;gold standard&#x201D; comparators to the data generated using other protocols, as described below.</p>
<p>We performed comparative analyses of the four protocols described above using Universal Human RNA (UHR) as total RNA input. UHR was spiked with synthetic RNAs from the External RNA Control Consortium (ERCC) at a constant proportion of the input amount to evaluate how well the observed RNA levels correlated with those expected theoretically (<xref ref-type="bibr" rid="B16">External RNA Controls Consortium, 2005</xref>). The SMART_v4 protocol and the standard RNaseH rRNA depletion protocol (<xref ref-type="bibr" rid="B21">Haile et al., 2017a</xref>, <xref ref-type="bibr" rid="B22">b</xref>, <xref ref-type="bibr" rid="B20">2019</xref>) served as our gold standards. Libraries were generated from total RNA input amounts ranging from 100 pg to 10 ng. Except for SMART_v4 and standard RNaseH, where one reaction was used for each of the indicated total RNA input amounts, duplicates were used for all the other protocols for each of the input amounts. Data from various post-sequencing and alignment metrics and expression comparisons are presented in <xref ref-type="supplementary-material" rid="S8">Supplementary Figures 2</xref>&#x2013;<xref ref-type="supplementary-material" rid="S8">9</xref> and are summarized in <xref ref-type="supplementary-material" rid="S8">Supplementary Figure 1B</xref>. We used the JAGuaR junction-aware alignment pipeline (<xref ref-type="bibr" rid="B7">Butterfield et al., 2014</xref>) for sequence analysis. Compared to STAR, we found that this pipeline enabled a higher mappability of reads to the human reference genome (<xref ref-type="supplementary-material" rid="S8">Supplementary Figure 2A</xref>) and a higher sensitivity in the detection of genes (<xref ref-type="supplementary-material" rid="S8">Supplementary Figure 2B</xref>) for all the libraries that were generated using the four protocols we described above.</p>
<p>The proportion of reads that aligned to the human genome reference (other than ribosomal RNA and mitochondrial RNA reads) was lowest for the modified RNaseH protocol (as low as 45% vs. &#x003E;82% for the other protocols) with minimal differences between the other protocols (<xref ref-type="supplementary-material" rid="S8">Supplementary Figure 3</xref>). The unaligned reads for the RNaseH protocol appear to result predominantly from microbial contamination. The non-exonic content was lowest for the exome and SMART_v4 protocols (&#x003C;8 and &#x003C;6%, respectively, vs. &#x003E;46% for the other protocols) (<xref ref-type="supplementary-material" rid="S8">Supplementary Figure 4</xref>). Consistent with a previous report (<xref ref-type="bibr" rid="B56">Ziegenhain et al., 2017</xref>), sensitivity of transcript detection and diversity were highest for the SMART_v4 protocol (<xref ref-type="supplementary-material" rid="S8">Supplementary Figures 1B</xref>, <xref ref-type="supplementary-material" rid="S8">5</xref>) but these advantages came at the cost of quantitative accuracy of transcript levels as demonstrated by lower expression correlation values with expected levels of ERCC transcripts, UHR expression values obtained using the standard RNaseH and polyA RNAseq protocols, and expression values of 1,000 genes that were previously (<xref ref-type="bibr" rid="B33">MAQC Consortium et al., 2006</xref>) quantified using qPCR, especially when compared with the SMARTer protocol. The SMARTer protocol gave the highest base error rate (<xref ref-type="supplementary-material" rid="S8">Supplementary Figure 1B</xref>) which appeared to be due to artifacts introduced at strand-switch sites (<xref ref-type="supplementary-material" rid="S8">Supplementary Figure 6</xref>). 
The proportion of properly paired reads for the SMARTer protocol (mean = 78%) was lower than that of the RNaseH protocol (mean = 89%) but higher than that of the SMART_v4 protocol (mean = 70%) (<xref ref-type="supplementary-material" rid="S8">Supplementary Figure 1B</xref>). Overall, the SMARTer protocol displayed higher accuracy in representing quantitative expression based on ERCC transcripts (<xref ref-type="supplementary-material" rid="S8">Supplementary Figures 1B</xref>, <xref ref-type="supplementary-material" rid="S8">7</xref>; lower panel), comparison with UHR expression values obtained using the standard RNaseH and polyA RNAseq protocols (<xref ref-type="supplementary-material" rid="S8">Supplementary Figures 1B</xref>, <xref ref-type="supplementary-material" rid="S8">7</xref>; upper panel), and relative to qPCR expression values of 1,000 genes (<xref ref-type="supplementary-material" rid="S8">Supplementary Figures 1B</xref>, <xref ref-type="supplementary-material" rid="S8">8</xref>). This protocol is also strand-specific (<xref ref-type="supplementary-material" rid="S8">Supplementary Figure 9</xref>), unlike most of the previously reported protocols for full-length scRNAseq (for example, the SMART_v4 protocol). Given these observations, we thus decided to further investigate the SMARTer protocol and its adaptability to a higher-throughput platform.</p>
</sec>
<sec id="S3.SS2">
<title>Adapting SMARTer to a Higher-Throughput, Strand-Specific Total RNA scRNAseq Protocol</title>
<p>To increase the throughput of the SMARTer protocol, we chose to adapt it to an open array platform from Scienion that integrates single-cell isolation with nanoliter reagent dispensing capacity. The instrument&#x2019;s cellenONE automated single-cell isolation feature uses piezo acoustic technology and optical monitoring of picodroplets to dispense cells: a droplet is dispensed into a waste recovery receptacle if the distal tip of the nozzle is automatically determined to contain no cell or multiple cells, or into a well if a single cell is found in the ejection zone. We adapted the instrument to dispense into a Wafergen chip (Takara) containing 5,184 nanoliter-scale wells, maximizing potential throughput and constraining reagent volumes to nanoliters in a fashion similar to that described previously for the Direct Library Preparation Plus (DLP+) single-cell genome protocol (<xref ref-type="bibr" rid="B28">Laks et al., 2019</xref>).</p>
<p>To determine the fidelity of single-cell dispensing, we stained cells and upon imaging of the chip, counted instances of no cell, single cell or multiple cells within individual wells. Based on seven independent runs, three different cell types and a total of 6,216 cells, post-imaging calls of single cells were made for 91&#x2013;98% of the wells (<xref ref-type="supplementary-material" rid="S8">Supplementary Figure 10</xref>). Importantly, all wells with multiple cells could be identified based on the image of unstained cells in the cell dispensing nozzle, and these could thus be excluded from downstream analyses. Given the protocol&#x2019;s high fidelity in delivering one cell per well, we adopted a staining-free protocol for our scRNAseq application. Modifications to the SMARTer protocol included expansion of the indexing capacity beyond 96 cells and workflow changes to enable early pooling of indexed cells before rRNA depletion and adaptation to our automated system as depicted in <xref ref-type="fig" rid="F1">Figure 1</xref>. We hereafter refer to this method as DLP-scRNAseq.</p>
</sec>
<sec id="S3.SS3">
<title>Comparison of DLP-scRNAseq With Bulk RNAseq and Orthogonal Assays</title>
<p>To examine the extent to which the DLP-scRNAseq protocol introduced artifacts affecting sequencing data quality or expression dynamics, we compared our single-cell data to data generated from populations of cells using the same protocol but in a 96-well format. Specifically, we compared 92 individually indexed cells and a pool of 402 individual cells with identical index, all of which were processed according to the DLP-scRNAseq protocol, to pools of 10 cells and 500 cells that were processed in bulk. An immortalized normal human astrocyte (NHA) cell line was used for these comparisons (<xref ref-type="bibr" rid="B47">Sonoda et al., 2001</xref>).</p>
<p>Analyses of sequencing quality (<xref ref-type="fig" rid="F2">Figure 2A</xref>) and quantification of the number of genes detected (<xref ref-type="fig" rid="F2">Figure 2B</xref>) indicated data of comparable quality between libraries generated using our DLP-scRNAseq protocol and those generated from bulk cell populations, suggesting that quality and gene detection were preserved as reaction volumes were reduced to nanoliter levels.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption><p>Comparisons of DLP-scRNAseq data and bulk RNAseq data and benchmarking using orthogonally generated data. <bold>(A)</bold> Alignment-based metrics of scRNAseq (DLP-scRNAseq) data vs. bulk (SMARTer) RNAseq data. 80 million reads were used for each data set. <bold>(B)</bold> Number of genes detected in DLP-scRNAseq data vs. bulk RNAseq data. 80 million reads were used. <bold>(C)</bold> Number of genes detected by at least one read in each of the 90 uniquely barcoded single cells (blue dots). Cells are sorted in ascending order based on number of reads. <bold>(D)</bold> Evaluation of sequencing saturation. Reads were down-sampled to numbers between 0.125 and 1.25 million and the number of genes with &#x003E;0 reads was enumerated at each sampling depth. Curve slopes are indicative of the yield of new genes sampled as a function of sequencing depth, with steeper slopes indicative of lower saturation levels. <bold>(E)</bold> Pearson correlation values comparing expression values from bulk-based RNAseq (SMARTer) data with DLP-scRNAseq data for UHR and NHA data. <bold>(F)</bold> Pearson correlations comparing DLP-scRNAseq and qPCR data (UHR) and known synthetic RNA measurements (ERCC).</p></caption>
<graphic xlink:href="fgene-12-665888-g002.tif"/>
</fig>
<p>Although DLP-scRNAseq libraries from two of the 92 individually indexed cells produced only 462 and 602 reads, respectively, reads from the remaining libraries yielded from 98,222 to 1,773,656 reads with an average of 757,791 reads per cell. The average number of expressed genes detected per cell was 7,371 (+/&#x2212; 903) (<xref ref-type="fig" rid="F2">Figure 2C</xref>). As shown in <xref ref-type="fig" rid="F2">Figure 2D</xref>, it appears that saturation of the number of genes detected was not reached at 1 million reads per cell.</p>
<p>Gene-level expression analysis showed that data from the DLP-scRNAseq pool of single cells were highly correlated with those of SMARTer libraries from bulk cells (Pearson&#x2019;s correlation = 0.82) (<xref ref-type="fig" rid="F2">Figure 2E</xref>). We included 5 pg UHR RNA in selected wells to represent the amount of RNA expected from a single cell. The Pearson correlation of gene-level expression from these 5 pg DLP-scRNAseq UHR libraries to bulk SMARTer libraries from 5 ng UHR total RNA input was 0.97&#x2013;0.98 (<xref ref-type="fig" rid="F2">Figure 2E</xref>), indicating good expression concordance between single-cell and bulk implementations of the method.</p>
<p>We further evaluated the accuracy of gene expression quantification, comparing the single-cell protocol to public qPCR data for 1,000 UHR genes and considered the expected expression levels of the 92 ERCC spike-in RNAs. The average Pearson correlation between the qPCR data and DLP-scRNAseq data for the 1,000 UHR genes was &#x003E;0.7 and the average correlation between expected and observed levels of ERCC RNAs was &#x003E;0.9 (<xref ref-type="fig" rid="F2">Figure 2F</xref>), once again indicating that the DLP-scRNAseq protocol generated accurate gene expression measurements.</p>
<p>To compare the sensitivity, accuracy and technical variability of DLP-scRNAseq, we compared counts of ERCC RNA-aligning reads in our protocol with those from publicly available gold standard full-length SMART-seq single-cell data (PRJEB20161, PRJEB20163, and PRJEB20166). To measure sensitivity, logistic regression to estimate the concentration at which an ERCC RNA had a 50% likelihood of being detected was applied as described previously (<xref ref-type="bibr" rid="B48">Svensson et al., 2017</xref>). The molecular limit of detection was derived from these results.</p>
<p>Based on an equivalent total number of reads (100,000 reads per cell), the median limit of detection with 50% probability was considerably lower for our protocol compared to datasets generated using SMART-seq protocols (50 vs. 268, 133, and 216) (<xref ref-type="supplementary-material" rid="S8">Supplementary Figure 11A</xref>). Pearson&#x2019;s correlation values of expected vs. observed ERCC RNA levels also indicated that our protocol was more accurate (median <italic>R</italic> = 0.84) than the SMART-seq protocols (median <italic>R</italic> = 0.68, 0.58, and 0.70, respectively) (<xref ref-type="supplementary-material" rid="S8">Supplementary Figure 11B</xref>). Sequencing depth had a negligible effect on the correlation values (<xref ref-type="supplementary-material" rid="S8">Supplementary Figure 12</xref>). Variability of ERCC expression, based on normalized total read numbers (100,000 total reads per cell), was assessed by: (1) adjusting the number of cells based on the sample with the fewest cells (random sampling of cells was applied to match the minimum number); (2) removing ERCCs with 0 reads in all cells within a sample; (3) calculating average expression levels of each of the ERCC RNAs across all cells within a sample; and (4) computing the coefficient of variation (% CV) for each ERCC RNA (standard deviation divided by the average expression level across cells within a sample). As shown in <xref ref-type="supplementary-material" rid="S8">Supplementary Figure 13</xref>, % CV was comparable between the different protocols.</p>
</sec>
<sec id="S3.SS4">
<title>DLP-scRNAseq Can Yield Sequences Spanning Entire Transcripts</title>
<p>Several lines of evidence supported the notion that our DLP-scRNAseq protocol could recover sequences spanning entire transcripts and not only terminal transcript regions. First, visual inspection of randomly selected highly expressed genes, such as the <italic>ACTB</italic> and <italic>FTL</italic> genes in <xref ref-type="fig" rid="F3">Figure 3A</xref>, showed that sequence reads mapped to all annotated exons. Second, the distribution of sequence reads along the 5&#x2032;&#x2013;3&#x2032; positions of transcript bodies was comparable between libraries that were generated from single cells and bulk populations of cells, including those that were generated using the standard rRNA depletion protocol (RNaseH) (<xref ref-type="fig" rid="F3">Figure 3B</xref>). Third, exon-level expression analysis revealed that the fractions of exons that were covered with at least one read were comparable between a pool of single cell libraries (<italic>n</italic> = 402 cells) and bulk RNAseq libraries regardless of transcript length and the 5&#x2032; or 3&#x2032; location of the exons (<xref ref-type="fig" rid="F4">Figure 4A</xref>). The exon-level expression from the pool of single-cell libraries was highly correlated with that of a bulk RNAseq library from 500 cells (Spearman correlation = 0.936) for the 333,517 exons detected in both the pool of single cell libraries and the bulk library (59% of the 562,205 total exons in the Ensembl annotation) (<xref ref-type="fig" rid="F4">Figure 4B</xref>). In addition to the commonly detected exons, 47,904 exons (from 17,704 genes) were uniquely detected in the pool of single cells and 21,429 exons (from 10,534 genes) were uniquely detected in the bulk library. The average RPKMs of the uniquely detected exons were 0.646 and 0.762 for the single-cell pool and the bulk libraries, respectively. 
The expression level of these uniquely detected exons was &#x223C;27-fold lower compared to the average RPKM of the exons detected in both the single-cell and bulk libraries (RPKMs of 18 and 20, respectively), indicating that highly expressed genes were detected more consistently, while the detection of less abundantly expressed genes was less robust, regardless of the method used.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption><p>DLP-scRNAseq profiles full-length RNAs. <bold>(A)</bold> A screen shot of an Integrative Genomics Viewer image of the genomic region spanning the <italic>ACTB</italic> (left) and <italic>FTL</italic> (right) genes. DLP-scRNAseq_1 is a single-cell library with a read number (710,000) representative of that obtained for other single cells (mean = 757,791 reads). Genomic location-specific read depth ranges are indicated within each plot, and the total number of reads for each library is shown between the plots. <bold>(B)</bold> Comparison of the normalized coverage of transcript bodies, from 5&#x2032; (left) to 3&#x2032; (right) of all annotated termini (3&#x2032; being the location of the polyadenylation site), achieved using DLP-scRNAseq and bulk RNAseq data. The left panel shows data from NHA cells and the right panel shows data that were generated from PBMCs. For the PBMC plot, data that were generated using the 3&#x2032;-end profiling 10X Chromium protocol are also shown, illustrating the 3&#x2032; end bias expected from the 10X platform.</p></caption>
<graphic xlink:href="fgene-12-665888-g003.tif"/>
</fig>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption><p>Exon level quantification of gene expression. <bold>(A)</bold> Comparisons of sensitivity of exon-level detection between DLP-scRNAseq and bulk protocols. Violin plots show the distributions of the density of the data representing various fractions of exons covered by one or more reads (<italic>Y</italic>-axis) for various ranges of transcript lengths in Ensembl annotations. Shown are data for all exonic regions (left panel), for full and partial exons falling within 5&#x2032; untranslated regions (UTRs) of transcripts (middle panel), and for full and partial exons falling within 3&#x2032; UTRs of transcripts (right panel). The coverage across coding regions of transcripts ranging in length from 200 to 5,000 nucleotides (178,348 transcripts in total) was similar between data from the DLP-scRNAseq pool of single cells and bulk libraries generated using SMARTer and RNaseH methods. Transcripts that are shorter than 200 nt (9,750 in total) showed more variable coverage, particularly at the 3&#x2032;- and 5&#x2032;-UTR regions. <bold>(B)</bold> A log-log plot of exon-level expression values comparing DLP-scRNAseq to bulk SMARTer data. Correlation values were calculated for exons with one or more reads in both datasets. The Spearman correlation was 0.93, indicating high similarity of expression of 333,517 exons. Exons captured to a higher extent with DLP-scRNAseq than SMARTer (&#x223C;459 exons, blue dots), falling below the diagonal (using the formula y &#x2013; 1.28x &#x003C; &#x2013;5), spanned all chromosomes and mapped to 354 genes.</p></caption>
<graphic xlink:href="fgene-12-665888-g004.tif"/>
</fig>
<p>Finally, we assessed whether fusion transcripts could be detected in our data. For this analysis, we made use of previously identified UHR fusion transcripts (<xref ref-type="bibr" rid="B44">Sakarya et al., 2012</xref>; <xref ref-type="fig" rid="F5">Figure 5A</xref>). Twenty-two of these fusion transcripts were detected in UHR libraries that were generated using the bulk RNaseH protocol; of these, nine were detected using DLP-scRNAseq (<xref ref-type="fig" rid="F5">Figure 5B</xref>). The fusion events that were not detected in the DLP-scRNAseq data were of low abundance, as they were detected in the bulk data with fewer spanning reads compared to the rest of the fusion events (<xref ref-type="fig" rid="F5">Figure 5B</xref>). These data indicated that DLP-scRNAseq can capture reads that span entire transcripts, depending on the abundance of such transcripts and sequencing depth.</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption><p>DLP-scRNAseq can be used to detect fusion transcripts. <bold>(A)</bold> Reads from 62 UHR (5 pg total RNA) libraries that were generated using the DLP-scRNAseq protocol were pooled and analyzed for intergenic transcript fusion junctions, previously identified and validated using qPCR (<xref ref-type="bibr" rid="B44">Sakarya et al., 2012</xref>). Black boxes indicate events that were confirmed by <italic>de-novo</italic> transcript sequence assembly (<xref ref-type="bibr" rid="B38">Nip et al., 2019</xref>). The numbers on the black boxes indicate the number of contiguous reads covering the fusion transcript. The fraction of down-sampled reads is indicated in the legend (e.g., 1&#x00D7; corresponds to 250 million reads, 0.1&#x00D7; corresponds to 25 million reads). The fewest total reads corresponds to 0.4 million/cell and the highest total number of reads represents 4 million reads per cell. <bold>(B)</bold> Comparison of the sensitivity of detection of fusion transcripts between the pool of UHR libraries that were generated using DLP-scRNAseq data and data from UHR bulk libraries (100 ng total RNA) that were generated using the RNaseH protocol. The numbers on the black boxes indicate frequencies of detection for each fusion event.</p></caption>
<graphic xlink:href="fgene-12-665888-g005.tif"/>
</fig>
</sec>
<sec id="S3.SS5">
<title>DLP-scRNAseq Allows for the Profiling of Non-polyadenylated Transcripts</title>
<p>We evaluated the capacity of DLP-scRNAseq to profile diverse species of RNA, including those lacking polyA tails. We merged the sequence reads from 62 UHR libraries that were each generated from 10 pg total RNA using DLP-scRNAseq and compared the resulting proportion of RNA biotypes to those that were detected in libraries that were generated from 10 and 25 ng total UHR RNA using rRNA depletion (RNaseH) and polyA-enriched protocols, respectively. In the DLP-scRNAseq data, 85.6% of the reads were mapped to protein-coding genes and 4.3% of the reads were mapped to long intergenic non-coding RNAs (lincRNAs) (<xref ref-type="fig" rid="F6">Figure 6A</xref>). In the RNaseH-derived data, 93.8% of the total number of reads were mapped to protein-coding genes and 2.6% of the total number of reads were mapped to lincRNAs (<xref ref-type="fig" rid="F6">Figure 6A</xref>). In the data obtained using the polyA-enriched protocol, 97.5% of the total number of reads were mapped to protein-coding genes and only 0.95% of the total number of reads were mapped to lincRNAs (<xref ref-type="fig" rid="F6">Figure 6A</xref>). There was also a higher proportion (4.7%) of other non-coding RNAs such as antisense RNAs, small nuclear RNAs (snRNAs) and small nucleolar RNAs (snoRNAs) in the DLP-scRNAseq data compared to the RNaseH (0.98%) and polyA data (0.24%) (<xref ref-type="fig" rid="F6">Figure 6A</xref>), which is consistent with the notion that our protocol can be used to profile a range of RNA biotypes.</p>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption><p>Demonstration of the capacity of DLP-scRNAseq to capture both polyadenylated and non-polyadenylated RNAs. <bold>(A)</bold> Detection of various RNA biotypes. The proportion of various classes of detected transcripts is shown for a pool of single cell libraries generated using DLP-scRNAseq and for bulk libraries that were generated using the SMARTer and RNaseH protocols. Total UHR RNA was used as input. <bold>(B)</bold> Detection of histone mRNAs. The proportion of histone transcripts is shown for a pool of single cell libraries generated using DLP-scRNAseq and for bulk libraries that were generated using the SMARTer and RNaseH protocols. Total UHR RNA was used as input. <bold>(C)</bold> Detection and quantification of polyA<sup>&#x2013;</sup> RNAs in scRNAseq data and bulk RNAseq data from NHA cells. Pearson correlations between expression profiles generated by DLP-scRNAseq or SMARTer and expression values of genes whose expression was enriched in polyA<sup>&#x2013;</sup> and polyA<sup>+</sup> fractions are shown.</p></caption>
<graphic xlink:href="fgene-12-665888-g006.tif"/>
</fig>
<fig id="F7" position="float">
<label>FIGURE 7</label>
<caption><p>Classification of PBMC cell types based on expression profiles that were generated using DLP-scRNAseq. <bold>(A)</bold> tSNE plot with DLP-scRNAseq cells colored by cluster. <bold>(B)</bold> tSNE plots with cells colored by normalized expression of the indicated marker gene. <bold>(C)</bold> Proportions of cells identified as the indicated cell types in the DLP-scRNAseq and 10X PBMC datasets. <bold>(D)</bold> Heatmap showing proportion of all possible event pairs that were found to be alternatively spliced between indicated cell types. The number of cells assigned to each cell type is indicated on the right: the total number of possible event pairs was calculated by (# of cell type 1 cells &#x00D7; # of cell type 2 cells &#x00D7; total number of transcripts tested). Absolute numbers of AS events between cell type pairs are also shown on the heatmap. <bold>(E)</bold> Example of a cell type-specific AS event (<italic>HIPK3</italic>, BRIE transcript ID ENSG00000110422.7.AS2). Left: sashimi plots showing read densities (in RPKM) within pools of cells assigned to the same cell type. Junction reads linking exons are also indicated with lines and labeled by their count. The outside exons are exons 3 (left) and 4 (right) in most Gencode v19 <italic>HIPK3</italic> transcripts (16 exons total in ENST00000525975.1, ENST00000379016.3, and ENST00000456517.1; 17 exons total in ENST00000303296.4); the middle exon, which is more frequently retained in dendritic cells compared to the other cell types shown, is specific to transcript ENST00000534262.1 (exon 2 of 4). Right: posterior distributions (blue curve, histogram in black) learned by BRIE for each cell type. Red bar depicts the mean, and the 95% confidence interval is indicated by dashed lines. The posterior (&#x03A8;) is a measure of the frequency of exon inclusion (0&#x2013;never; 1&#x2013;always).</p></caption>
<graphic xlink:href="fgene-12-665888-g007.tif"/>
</fig>
<p>Non-coding RNAs, including lincRNAs, may be polyadenylated (<xref ref-type="bibr" rid="B42">Ravasi et al., 2006</xref>) while histone mRNAs are among those lacking polyA tails (<xref ref-type="bibr" rid="B34">Marzluff et al., 2008</xref>). We evaluated the proportion of histone mRNAs in the UHR DLP-scRNAseq, RNaseH and polyA-enriched libraries described above. There were eight- and ninefold enrichments of histone mRNAs in the DLP-scRNAseq and RNaseH libraries, respectively, compared to the polyA-enriched library (<xref ref-type="fig" rid="F6">Figure 6B</xref>), indicating that these protocols effectively capture histone transcripts lacking polyA tails.</p>
<p><xref ref-type="bibr" rid="B53">Yang et al. (2011)</xref> previously identified 278&#x2013;324 transcripts that were enriched in polyA<sup>&#x2013;</sup> fractions in two different human cell lines. Approximately 95% of these transcripts were detected in our DLP-scRNAseq data from 402 pooled NHA cells. We compared the gene-level expression of these transcripts in our data from pooled NHA cells to those that were reported from the polyA<sup>&#x2013;</sup> fraction in <xref ref-type="bibr" rid="B53">Yang et al. (2011)</xref> and found the Pearson expression correlations to be 0.80 and 0.86 when compared to the values from the two cell lines (<xref ref-type="fig" rid="F6">Figure 6C</xref>). The corresponding values for the bulk SMARTer protocol were 0.83 and 0.89, respectively. In contrast, Pearson correlations using values from the polyA<sup>+</sup> fraction were lower (0.06 and 0.33 for DLP-scRNAseq and 0.07 and 0.32 for bulk SMARTer; <xref ref-type="fig" rid="F6">Figure 6C</xref>), which likely reflects background noise consistent with the transcripts being not polyadenylated.</p>
<p>Next, we examined whether DLP-scRNAseq could detect enhancer RNAs (eRNAs), which represent a class of non-polyadenylated nuclear RNAs (<xref ref-type="bibr" rid="B29">Lam et al., 2014</xref>). To do so, we used a previously described approach (<xref ref-type="bibr" rid="B23">Hayashi et al., 2018</xref>) that leveraged genomic coordinates from the GENCODE and CAGE FANTOM databases. First, we performed comparative analysis of eRNAs for the single-cell protocols described above, namely SMARTer, SMART_V4, exome, RNaseH (RBD), and modified RBD, using 10 ng UHR total RNA input and a normalized number of total reads (10 million). As expected, the exome approach resulted in negligible levels of eRNAs and the polyA-based SMART_V4 similarly showed minimal eRNA levels (<xref ref-type="supplementary-material" rid="S8">Supplementary Figure 14A</xref>). The SMARTer protocol, which underpins our single cell protocol, displayed the highest sensitivity of eRNA detection at a level comparable to that of the modified rRNA depletion protocol (<xref ref-type="supplementary-material" rid="S8">Supplementary Figure 14A</xref>). Using a comparable number of NHA cells and normalized number of total reads (80 million), the pooled data generated using our DLP-scRNAseq protocol showed a comparable level of eRNA detection relative to that of the bulk SMARTer protocol (<xref ref-type="supplementary-material" rid="S8">Supplementary Figure 14B</xref>).</p>
<p>Circular RNAs (cRNAs) are another class of non-polyadenylated RNAs. Using a recently reported approach (<xref ref-type="bibr" rid="B54">Zhang et al., 2020</xref>), we compared the protocols described above using varying input amounts (0.1&#x2013;10 ng) of UHR total RNA. This analysis showed that the SMARTer protocol displayed &#x003E; 4-fold higher cRNA levels compared to the other protocols. The exome and SMART_V4 approaches resulted in the lowest cRNA recovery (<xref ref-type="supplementary-material" rid="S8">Supplementary Figure 15A</xref>). <xref ref-type="supplementary-material" rid="S8">Supplementary Figure 15B</xref> shows that DLP-scRNAseq identified &#x223C;50% of the cRNAs that were detected using the bulk SMARTer protocol from a comparable number of NHA cells. Taken together, these data indicate that DLP-scRNAseq can be used to profile both polyA<sup>+</sup> and polyA<sup>&#x2013;</sup> transcripts.</p>
</sec>
<sec id="S3.SS6">
<title>DLP-scRNAseq Enables Cell Type Classification Using a Biologically Heterogeneous Sample</title>
<p>To assess the capacity of the DLP-scRNAseq protocol to discern cell types from a biologically complex sample, we processed cryopreserved human peripheral blood mononuclear cells (PBMCs) using DLP-scRNAseq. Of the libraries from 518 cells that were sequenced on one-third of a HiSeq 2500 lane (188 million reads), 473 libraries had &#x003E; 100,000 reads with an average of 383,812 reads per cell. The average number of genes detected per cell was 2,830 (<xref ref-type="supplementary-material" rid="S8">Supplementary Figure 16</xref>).</p>
<p>To identify distinct cell types, we first performed clustering analysis on the expression profile of the PBMCs, identifying nine clusters (<xref ref-type="fig" rid="F7">Figure 7A</xref>). Examination of genes that marked the expression of each cluster (<xref ref-type="supplementary-material" rid="S8">Supplementary Table 2</xref>) revealed the anticipated cell types at expected ratios (<xref ref-type="bibr" rid="B26">Kleiveland, 2015</xref>), namely T cells [clusters 4, 5, and 7 (&#x223C;57%)], collectively marked by expression of <italic>IL7R</italic> (<xref ref-type="bibr" rid="B10">Carrette and Surh, 2012</xref>) and the T cell surface glycoproteins <italic>CD5</italic> and <italic>CD6</italic> (<xref ref-type="bibr" rid="B18">Gon&#x00E7;alves et al., 2018</xref>); B cells [cluster 1 (&#x223C;6%)], enriched for expression of the B cell receptor signaling molecule <italic>MS4A1</italic> (<xref ref-type="bibr" rid="B41">Polyak et al., 2008</xref>); CD14+ (cluster 2) and CD16+ (cluster 6) monocytes (<xref ref-type="bibr" rid="B57">Ziegler-Heitbrock et al., 2010</xref>) (&#x223C;18%); natural killer cells [cluster 9 (&#x223C;7%)], enriched for markers such as <italic>KLRF1</italic> (<xref ref-type="bibr" rid="B36">Moretta et al., 2003</xref>) and <italic>KLRD1</italic> (<xref ref-type="bibr" rid="B4">Borrego et al., 2005</xref>); and dendritic cells [cluster 8 (&#x223C;4%)], marked by high expression of <italic>CD74</italic> and <italic>FCER1A</italic> (<xref ref-type="bibr" rid="B19">Greer et al., 2014</xref>; <xref ref-type="fig" rid="F7">Figure 7B</xref>). Within the T cell clusters, cells in clusters 4 and 7 (&#x223C;60% of T cells) expressed <italic>CD4</italic>, whereas cluster 5 (&#x223C;40% of T cells) was enriched in cells expressing <italic>CD8A</italic>. Cells in cluster 3 were not enriched for cell type-specific markers (FDR &#x003C; 0.05). 
However, closer examination of QC measures revealed that this population had a high proportion of reads aligned to ERCCs (<xref ref-type="supplementary-material" rid="S8">Supplementary Figure 17A</xref>), indicating that these may have been poorer quality libraries that were not filtered using standard QC methods.</p>
<p>To analyze a comparable dataset produced using a different platform, we also obtained data from 1,223 PBMCs profiled using the 10X Genomics Chromium platform<sup><xref ref-type="fn" rid="footnote6">6</xref></sup>. Our clustering analysis also identified nine clusters for this dataset which displayed similar expression patterns to those found in the DLP-scRNAseq dataset: cell clusters 2, 5, and 6 (44% of cells) expressed markers of T cells such as <italic>IL7R</italic>, cluster 4 (&#x223C;16%) was enriched for expression of the B cell marker <italic>MS4A1</italic>, cells in cluster 9 expressed the NK cell marker <italic>KLRF1</italic>, clusters 3 (&#x223C;26%) and 7 (&#x223C;3%) appeared to be composed of CD14<sup>+</sup> and CD16<sup>+</sup> monocytes, respectively, and cells in cluster 1 (&#x223C;5%) displayed high expression of <italic>CD74</italic> and <italic>FCER1A</italic>, indicating that they were likely dendritic cells (<xref ref-type="supplementary-material" rid="S8">Supplementary Figures 17B,C</xref> and <xref ref-type="supplementary-material" rid="S8">Supplementary Table 2</xref>). Similar to our observations for the PBMC dataset obtained using DLP-scRNAseq, cells in cluster 8 were not characterized by a pattern of marker gene expression that was clearly indicative of a cell type, and this cluster appeared to be composed of lower-quality cells as evidenced by its high proportion of read counts assigned to mitochondrial genes (<xref ref-type="supplementary-material" rid="S8">Supplementary Figure 17D</xref>). Overall, the cell type proportions identified in the DLP-scRNAseq and 10X datasets were comparable (<xref ref-type="fig" rid="F7">Figure 7C</xref>) despite some differences that can also be attributed to the individual source variation of the PBMC samples.</p>
<p>To determine whether DLP-scRNAseq data could be used to identify alternatively spliced (AS) transcripts, we used BRIE (<xref ref-type="bibr" rid="B24">Huang and Sanguinetti, 2017</xref>) to quantify exon inclusion events. We first performed pairwise comparisons between individual cells and, for each pair of cell types, calculated the proportion of all possible events that were identified as alternatively spliced (Bayes factor &#x2265;10; Methods). Pairs of cells assigned to the same cell type consistently had a lower proportion of AS events between them than pairs of cells assigned to different cell types (<xref ref-type="fig" rid="F7">Figure 7D</xref>). Additionally, pairs of cells from similar cell types (e.g., CD4+ T-cells and CD8+ T-cells) tended to have lower proportions of AS events between them than pairs of cells assigned to more distinct cell types (e.g., B-cells and dendritic cells). These results both supported the clustering-based cell type assignments and indicated that alternative splicing events can be identified between individual cells at ratios that are consistent with expected cell type differences.</p>
<p>We next performed alternative splicing analyses comparing distinct cell types (Methods). We identified 3,008 AS events between at least two cell types (Bayes factor &#x2265;10), and from this list identified 179 cell type-specific events (example shown in <xref ref-type="fig" rid="F7">Figure 7E</xref>; full results in <xref ref-type="supplementary-material" rid="S8">Supplementary Table 3</xref>). Notably, these included events that have previously been identified: for example, <italic>BTG3</italic>, which has been found to be differentially spliced in lung cancers (<xref ref-type="bibr" rid="B12">Chen et al., 2013</xref>), appeared to be most highly expressed in T-cells and NK cells, and inclusion of exon 4 was significantly higher in CD4+ T-cells than other cell types (<xref ref-type="supplementary-material" rid="S8">Supplementary Figure 18A</xref>). Similarly, several <italic>CTSB</italic> splice variants, including one lacking exon 2, have been shown to be differentially expressed in cancer (<xref ref-type="bibr" rid="B30">Liyanage et al., 2019</xref>), and we found evidence in our dataset that CD14+ monocytes had significantly more expression of exon 2 than other cell types (<xref ref-type="supplementary-material" rid="S8">Supplementary Figure 18B</xref>). Our results thus indicate that DLP-scRNAseq can be used to study AS transcripts enriched in comparisons of cell types.</p>
<p><xref ref-type="bibr" rid="B52">Verboom et al. (2019)</xref> recently reported single-cell profiling results from the same scRNAseq (SMARTer) kit that we used here. Another study also reported on a similar protocol (<xref ref-type="bibr" rid="B25">Isakova et al., 2020</xref>). Unique contributions of our work here include: analyses revealing the ability of DLP-scRNAseq to discern cellular heterogeneity; the orthogonal validation of expression accuracy using qPCR on 1,000 genes; our comparisons to bulk total RNAseq data; and expanded analysis of full-length transcript coverage. Further, our work adapts the kit to a different automation platform of single-cell isolation and library construction that allows for the simultaneous processing of hundreds to thousands of cells, while previous protocols are limited to 96 cells per run. Our data demonstrate that our approach allows for measurements of full-length transcript expression of both polyA<sup>+</sup> and polyA<sup>&#x2013;</sup> RNAs at a single-cell resolution for hundreds to thousands of cells per run, thus providing an avenue to comprehensively study gene expression in the context of complex, heterogeneous biological samples at single-cell resolution.</p>
</sec>
</sec>
<sec id="S4">
<title>Data Availability Statement</title>
<p>The datasets presented in this study can be found in the NCBI Sequence Read Archive (accession <ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="SRP286135">SRP286135</ext-link>).</p>
</sec>
<sec id="S5">
<title>Author Contributions</title>
<p>SH and MAM: conception. SH, RDC, VGL, LW, and MAM: writing. SH, RDC, VGL, LW, and KB: graphics. SH, RDC, VGL, LW, SP, SB, KN, and DLT: execution. SH, MB, EC, RJNC, RAM, AJM, KLM, YZ, MH, SA, SJMJ, and MAM: grant application and supervision. All authors contributed to the article and approved the submitted version.</p>
</sec>
<sec sec-type="COI-statement" id="conf1">
<title>Conflict of Interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
</body>
<back>
<fn-group>
<fn fn-type="financial-disclosure">
<p><bold>Funding.</bold> This study was funded by the Canadian Cancer Society (Grant No. 705859), the Canadian Institutes of Health Research (Grant Nos. CCP-0160390 and FDN-143288) and Genome Canada/Genome British Columbia (Grant No. 262SEQ). We gratefully acknowledge the support of the BC Cancer Foundation, the Canada Foundation for Innovation, and the Canada Research Chairs program.</p>
</fn>
</fn-group>
<ack>
<p>We are grateful for the contributions from staff at Canada&#x2019;s Michael Smith Genome Sciences Centre at BC Cancer, including staff from the Biospecimen, Quality Assurance, Library Construction (Core and Technical Development), Instrumentation, Sequencing, LIMS, Purchasing, Project Management, and Bioinformatics teams. We thank Jungeun Song and Dr. Suganthi Chittaranjan for their assistance in maintaining cell cultures and other members of the Marra lab for insightful discussions. We also thank Dr. Stephen Yip for sharing the NHA cell line.</p>
</ack>
<sec id="S8" sec-type="supplementary-material">
<title>Supplementary Material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fgene.2021.665888/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fgene.2021.665888/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Table_1.XLSX" id="TS1" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table_2.XLSX" id="TS2" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table_3.XLSX" id="TS3" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table_4.DOCX" id="TS4" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Data_Sheet_1.PDF" id="DS1" mimetype="application/pdf" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Anders</surname> <given-names>S.</given-names></name> <name><surname>Pyl</surname> <given-names>P. T.</given-names></name> <name><surname>Huber</surname> <given-names>W.</given-names></name></person-group> (<year>2015</year>). <article-title>HTSeq&#x2013;a Python framework to work with high-throughput sequencing data.</article-title> <source><italic>Bioinformatics</italic></source> <volume>31</volume> <fpage>166</fpage>&#x2013;<lpage>169</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btu638</pub-id> <pub-id pub-id-type="pmid">25260700</pub-id></citation></ref>
<ref id="B2"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Aran</surname> <given-names>D.</given-names></name> <name><surname>Looney</surname> <given-names>A. P.</given-names></name> <name><surname>Liu</surname> <given-names>L.</given-names></name> <name><surname>Wu</surname> <given-names>E.</given-names></name> <name><surname>Fong</surname> <given-names>V.</given-names></name> <name><surname>Hsu</surname> <given-names>A.</given-names></name><etal/></person-group> (<year>2019</year>). <article-title>Reference-based analysis of lung single-cell sequencing reveals a transitional profibrotic macrophage.</article-title> <source><italic>Nat. Immunol.</italic></source> <volume>20</volume> <fpage>163</fpage>&#x2013;<lpage>172</lpage>. <pub-id pub-id-type="doi">10.1038/s41590-018-0276-y</pub-id> <pub-id pub-id-type="pmid">30643263</pub-id></citation></ref>
<ref id="B3"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Balbin</surname> <given-names>O. A.</given-names></name> <name><surname>Malik</surname> <given-names>R.</given-names></name> <name><surname>Dhanasekaran</surname> <given-names>S. M.</given-names></name> <name><surname>Prensner</surname> <given-names>J. R.</given-names></name> <name><surname>Cao</surname> <given-names>X.</given-names></name> <name><surname>Wu</surname> <given-names>Y. M.</given-names></name><etal/></person-group> (<year>2015</year>). <article-title>The landscape of antisense gene expression in human cancers.</article-title> <source><italic>Genome Res.</italic></source> <volume>25</volume> <fpage>1068</fpage>&#x2013;<lpage>1079</lpage>. <pub-id pub-id-type="doi">10.1101/gr.180596.114</pub-id> <pub-id pub-id-type="pmid">26063736</pub-id></citation></ref>
<ref id="B4"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Borrego</surname> <given-names>F.</given-names></name> <name><surname>Masilamani</surname> <given-names>M.</given-names></name> <name><surname>Kabat</surname> <given-names>J.</given-names></name> <name><surname>Sanni</surname> <given-names>T. B.</given-names></name> <name><surname>Coligan</surname> <given-names>J. E.</given-names></name></person-group> (<year>2005</year>). <article-title>The cell biology of the human natural killer cell CD94/NKG2A inhibitory receptor.</article-title> <source><italic>Mol. Immunol.</italic></source> <volume>42</volume> <fpage>485</fpage>&#x2013;<lpage>488</lpage>. <pub-id pub-id-type="doi">10.1016/j.molimm.2004.07.031</pub-id> <pub-id pub-id-type="pmid">15607803</pub-id></citation></ref>
<ref id="B5"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bray</surname> <given-names>N. L.</given-names></name> <name><surname>Pimentel</surname> <given-names>H.</given-names></name> <name><surname>Melsted</surname> <given-names>P.</given-names></name> <name><surname>Pachter</surname> <given-names>L.</given-names></name></person-group> (<year>2016</year>). <article-title>Near-optimal probabilistic RNA-seq quantification.</article-title> <source><italic>Nat. Biotechnol.</italic></source> <volume>34</volume> <fpage>525</fpage>&#x2013;<lpage>527</lpage>. <pub-id pub-id-type="doi">10.1038/nbt.3519</pub-id> <pub-id pub-id-type="pmid">27043002</pub-id></citation></ref>
<ref id="B6"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bushnell</surname> <given-names>B.</given-names></name> <name><surname>Rood</surname> <given-names>J.</given-names></name> <name><surname>Singer</surname> <given-names>E.</given-names></name></person-group> (<year>2017</year>). <article-title>BBMerge - accurate paired shotgun read merging via overlap.</article-title> <source><italic>PLoS One</italic></source> <volume>12</volume>:<fpage>e0185056</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0185056</pub-id> <pub-id pub-id-type="pmid">29073143</pub-id></citation></ref>
<ref id="B7"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Butterfield</surname> <given-names>Y. S.</given-names></name> <name><surname>Kreitzman</surname> <given-names>M.</given-names></name> <name><surname>Thiessen</surname> <given-names>N.</given-names></name> <name><surname>Corbett</surname> <given-names>R. D.</given-names></name> <name><surname>Li</surname> <given-names>Y.</given-names></name> <name><surname>Pang</surname> <given-names>J.</given-names></name><etal/></person-group> (<year>2014</year>). <article-title>JAGuaR: junction alignments to genome for RNA-Seq reads.</article-title> <source><italic>PLoS One</italic></source> <volume>9</volume>:<fpage>e102398</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0102398</pub-id> <pub-id pub-id-type="pmid">25062255</pub-id></citation></ref>
<ref id="B8"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cao</surname> <given-names>J.</given-names></name> <name><surname>Packer</surname> <given-names>J. S.</given-names></name> <name><surname>Ramani</surname> <given-names>V.</given-names></name> <name><surname>Cusanovich</surname> <given-names>D. A.</given-names></name> <name><surname>Huynh</surname> <given-names>C.</given-names></name> <name><surname>Daza</surname> <given-names>R.</given-names></name><etal/></person-group> (<year>2017</year>). <article-title>Comprehensive single-cell transcriptional profiling of a multicellular organism.</article-title> <source><italic>Science</italic></source> <volume>357</volume> <fpage>661</fpage>&#x2013;<lpage>667</lpage>. <pub-id pub-id-type="doi">10.1126/science.aam8940</pub-id> <pub-id pub-id-type="pmid">28818938</pub-id></citation></ref>
<ref id="B9"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cao</surname> <given-names>J.</given-names></name> <name><surname>Spielmann</surname> <given-names>M.</given-names></name> <name><surname>Qiu</surname> <given-names>X.</given-names></name> <name><surname>Huang</surname> <given-names>X.</given-names></name> <name><surname>Ibrahim</surname> <given-names>D. M.</given-names></name> <name><surname>Hill</surname> <given-names>A. J.</given-names></name><etal/></person-group> (<year>2019</year>). <article-title>The single-cell transcriptional landscape of mammalian organogenesis.</article-title> <source><italic>Nature</italic></source> <volume>566</volume> <fpage>496</fpage>&#x2013;<lpage>502</lpage>. <pub-id pub-id-type="doi">10.1038/s41586-019-0969-x</pub-id> <pub-id pub-id-type="pmid">30787437</pub-id></citation></ref>
<ref id="B10"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Carrette</surname> <given-names>F.</given-names></name> <name><surname>Surh</surname> <given-names>C. D.</given-names></name></person-group> (<year>2012</year>). <article-title>IL-7 signaling and CD127 receptor regulation in the control of T cell homeostasis.</article-title> <source><italic>Semin. Immunol.</italic></source> <volume>24</volume> <fpage>209</fpage>&#x2013;<lpage>217</lpage>. <pub-id pub-id-type="doi">10.1016/j.smim.2012.04.010</pub-id> <pub-id pub-id-type="pmid">22551764</pub-id></citation></ref>
<ref id="B11"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chen</surname> <given-names>S.</given-names></name> <name><surname>Zhou</surname> <given-names>Y.</given-names></name> <name><surname>Chen</surname> <given-names>Y.</given-names></name> <name><surname>Gu</surname> <given-names>J.</given-names></name></person-group> (<year>2018</year>). <article-title>Fastp: an ultra-fast all-in-one FASTQ preprocessor.</article-title> <source><italic>Bioinformatics</italic></source> <volume>34</volume> <fpage>i884</fpage>&#x2013;<lpage>i890</lpage>.</citation></ref>
<ref id="B12"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chen</surname> <given-names>X.</given-names></name> <name><surname>Chen</surname> <given-names>G.</given-names></name> <name><surname>Cao</surname> <given-names>X.</given-names></name> <name><surname>Zhou</surname> <given-names>Y.</given-names></name> <name><surname>Yang</surname> <given-names>T.</given-names></name> <name><surname>Wei</surname> <given-names>S.</given-names></name><etal/></person-group> (<year>2013</year>). <article-title>Downregulation of BTG3 in non-small cell lung cancer.</article-title> <source><italic>Biochem. Biophys. Res. Commun.</italic></source> <volume>437</volume> <fpage>173</fpage>&#x2013;<lpage>178</lpage>. <pub-id pub-id-type="doi">10.1016/j.bbrc.2013.06.062</pub-id> <pub-id pub-id-type="pmid">23810394</pub-id></citation></ref>
<ref id="B13"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cieslik</surname> <given-names>M.</given-names></name> <name><surname>Chugh</surname> <given-names>R.</given-names></name> <name><surname>Wu</surname> <given-names>Y. M.</given-names></name> <name><surname>Wu</surname> <given-names>M.</given-names></name> <name><surname>Brennan</surname> <given-names>C.</given-names></name> <name><surname>Lonigro</surname> <given-names>R.</given-names></name><etal/></person-group> (<year>2015</year>). <article-title>The use of exome capture RNA-seq for highly degraded RNA with application to clinical cancer sequencing.</article-title> <source><italic>Genome Res.</italic></source> <volume>25</volume> <fpage>1372</fpage>&#x2013;<lpage>1381</lpage>. <pub-id pub-id-type="doi">10.1101/gr.189621.115</pub-id> <pub-id pub-id-type="pmid">26253700</pub-id></citation></ref>
<ref id="B14"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dobin</surname> <given-names>A.</given-names></name> <name><surname>Davis</surname> <given-names>C. A.</given-names></name> <name><surname>Schlesinger</surname> <given-names>F.</given-names></name> <name><surname>Drenkow</surname> <given-names>J.</given-names></name> <name><surname>Zaleski</surname> <given-names>C.</given-names></name> <name><surname>Jha</surname> <given-names>S.</given-names></name><etal/></person-group> (<year>2013</year>). <article-title>STAR: ultrafast universal RNA-seq aligner.</article-title> <source><italic>Bioinformatics</italic></source> <volume>29</volume> <fpage>15</fpage>&#x2013;<lpage>21</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/bts635</pub-id> <pub-id pub-id-type="pmid">23104886</pub-id></citation></ref>
<ref id="B15"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Durruthy-Durruthy</surname> <given-names>R.</given-names></name> <name><surname>Ray</surname> <given-names>M.</given-names></name></person-group> (<year>2018</year>). <article-title>Using Fluidigm C1 to generate single-cell full-length cDNA libraries for mRNA sequencing.</article-title> <source><italic>Methods Mol. Biol.</italic></source> <volume>1706</volume> <fpage>199</fpage>&#x2013;<lpage>221</lpage>. <pub-id pub-id-type="doi">10.1007/978-1-4939-7471-9_11</pub-id></citation></ref>
<ref id="B16"><citation citation-type="journal"><collab>External RNA Controls Consortium</collab>, (<year>2005</year>). <article-title>Proposed methods for testing and selecting the ERCC external RNA controls.</article-title> <source><italic>BMC Genom.</italic></source> <volume>6</volume>:<fpage>150</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2164-6-150</pub-id> <pub-id pub-id-type="pmid">16266432</pub-id></citation></ref>
<ref id="B17"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Falcao</surname> <given-names>A. M.</given-names></name> <name><surname>van Bruggen</surname> <given-names>D.</given-names></name> <name><surname>Marques</surname> <given-names>S.</given-names></name> <name><surname>Meijer</surname> <given-names>M.</given-names></name> <name><surname>J&#x00E4;kel</surname> <given-names>S.</given-names></name> <name><surname>Agirre</surname> <given-names>E.</given-names></name><etal/></person-group> (<year>2018</year>). <article-title>Disease-specific oligodendrocyte lineage cells arise in multiple sclerosis.</article-title> <source><italic>Nat. Med.</italic></source> <volume>24</volume> <fpage>1837</fpage>&#x2013;<lpage>1844</lpage>. <pub-id pub-id-type="doi">10.1038/s41591-018-0236-y</pub-id> <pub-id pub-id-type="pmid">30420755</pub-id></citation></ref>
<ref id="B18"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gon&#x00E7;alves</surname> <given-names>C. M.</given-names></name> <name><surname>Henriques</surname> <given-names>S. N.</given-names></name> <name><surname>Santos</surname> <given-names>R. F.</given-names></name> <name><surname>Carmo</surname> <given-names>A. M.</given-names></name></person-group> (<year>2018</year>). <article-title>CD6, a rheostat-type signalosome that tunes T cell activation.</article-title> <source><italic>Front. Immunol.</italic></source> <volume>9</volume>:<fpage>2994</fpage>. <pub-id pub-id-type="doi">10.3389/fimmu.2018.02994</pub-id> <pub-id pub-id-type="pmid">30619347</pub-id></citation></ref>
<ref id="B19"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Greer</surname> <given-names>A. M.</given-names></name> <name><surname>Wu</surname> <given-names>N.</given-names></name> <name><surname>Putnam</surname> <given-names>A. L.</given-names></name> <name><surname>Woodruff</surname> <given-names>P. G.</given-names></name> <name><surname>Wolters</surname> <given-names>P.</given-names></name> <name><surname>Kinet</surname> <given-names>J.-P.</given-names></name><etal/></person-group> (<year>2014</year>). <article-title>Serum IgE clearance is facilitated by human Fc&#x03B5;RI internalization.</article-title> <source><italic>J. Clin. Invest.</italic></source> <volume>124</volume> <fpage>1187</fpage>&#x2013;<lpage>1198</lpage>.</citation></ref>
<ref id="B20"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Haile</surname> <given-names>S.</given-names></name> <name><surname>Corbett</surname> <given-names>R. D.</given-names></name> <name><surname>Bilobram</surname> <given-names>S.</given-names></name> <name><surname>Mungall</surname> <given-names>K.</given-names></name> <name><surname>Grande</surname> <given-names>B. M.</given-names></name> <name><surname>Kirk</surname> <given-names>H.</given-names></name><etal/></person-group> (<year>2019</year>). <article-title>Evaluation of protocols for rRNA depletion-based RNA sequencing of nanogram inputs of mammalian total RNA.</article-title> <source><italic>PLoS One</italic></source> <volume>14</volume>:<fpage>e0224578</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0224578</pub-id> <pub-id pub-id-type="pmid">31671154</pub-id></citation></ref>
<ref id="B21"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Haile</surname> <given-names>S.</given-names></name> <name><surname>Corbett</surname> <given-names>R. D.</given-names></name> <name><surname>MacLeod</surname> <given-names>T.</given-names></name> <name><surname>Bilobram</surname> <given-names>S.</given-names></name> <name><surname>Smailus</surname> <given-names>D.</given-names></name> <name><surname>Tsao</surname> <given-names>P.</given-names></name><etal/></person-group> (<year>2017a</year>). <article-title>Increasing quality, throughput and speed of sample preparation for strand-specific messenger RNA sequencing.</article-title> <source><italic>BMC Genom.</italic></source> <volume>18</volume>:<fpage>515</fpage>.</citation></ref>
<ref id="B22"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Haile</surname> <given-names>S.</given-names></name> <name><surname>Pandoh</surname> <given-names>P.</given-names></name> <name><surname>McDonald</surname> <given-names>H.</given-names></name> <name><surname>Corbett</surname> <given-names>R. D.</given-names></name> <name><surname>Tsao</surname> <given-names>P.</given-names></name> <name><surname>Kirk</surname> <given-names>H.</given-names></name><etal/></person-group> (<year>2017b</year>). <article-title>Automated high throughput nucleic acid purification from formalin-fixed paraffin-embedded tissue samples for next generation sequence analysis.</article-title> <source><italic>PLoS One</italic></source> <volume>12</volume>:<fpage>e0178706</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0178706</pub-id> <pub-id pub-id-type="pmid">28570594</pub-id></citation></ref>
<ref id="B23"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hayashi</surname> <given-names>T.</given-names></name> <name><surname>Ozaki</surname> <given-names>H.</given-names></name> <name><surname>Sasagawa</surname> <given-names>Y.</given-names></name> <name><surname>Umeda</surname> <given-names>M.</given-names></name> <name><surname>Danno</surname> <given-names>H.</given-names></name> <name><surname>Nikaido</surname> <given-names>I.</given-names></name></person-group> (<year>2018</year>). <article-title>Single-cell full-length total RNA sequencing uncovers dynamics of recursive splicing and enhancer RNAs.</article-title> <source><italic>Nat. Commun.</italic></source> <volume>9</volume>:<fpage>619</fpage>.</citation></ref>
<ref id="B24"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Huang</surname> <given-names>Y.</given-names></name> <name><surname>Sanguinetti</surname> <given-names>G.</given-names></name></person-group> (<year>2017</year>). <article-title>BRIE: transcriptome-wide splicing quantification in single cells.</article-title> <source><italic>Genome Biol.</italic></source> <volume>18</volume>:<fpage>123</fpage>.</citation></ref>
<ref id="B25"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Isakova</surname> <given-names>A.</given-names></name> <name><surname>Neff</surname> <given-names>N.</given-names></name> <name><surname>Quake</surname> <given-names>S. R.</given-names></name></person-group> (<year>2020</year>). <article-title>Single cell profiling of total RNA using Smart-seq-total.</article-title> <source><italic>bioRxiv</italic></source> [Preprint]. <pub-id pub-id-type="doi">10.1101/2020.06.02.131060</pub-id></citation></ref>
<ref id="B26"><citation citation-type="book"><person-group person-group-type="author"><name><surname>Kleiveland</surname> <given-names>C. R.</given-names></name></person-group> (<year>2015</year>). &#x201C;<article-title>Peripheral blood mononuclear cells</article-title>,&#x201D; in <source><italic>The Impact of Food Bioactives on Health: In Vitro and Ex Vivo Models</italic></source>, <role>eds</role> <person-group person-group-type="editor"><name><surname>Verhoeckx</surname> <given-names>K.</given-names></name> <name><surname>Cotter</surname> <given-names>P.</given-names></name> <name><surname>L&#x00F3;pez-Exp&#x00F3;sito</surname> <given-names>I.</given-names></name> <name><surname>Kleiveland</surname> <given-names>C.</given-names></name> <name><surname>Lea</surname> <given-names>T.</given-names></name> <name><surname>Mackie</surname> <given-names>A.</given-names></name><etal/></person-group> (<publisher-loc>Cham</publisher-loc>: <publisher-name>Springer International Publishing</publisher-name>), <fpage>161</fpage>&#x2013;<lpage>167</lpage>.</citation></ref>
<ref id="B27"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kolodziejczyk</surname> <given-names>A. A.</given-names></name> <name><surname>Kim</surname> <given-names>J. K.</given-names></name> <name><surname>Svensson</surname> <given-names>V.</given-names></name> <name><surname>Marioni</surname> <given-names>J. C.</given-names></name> <name><surname>Teichmann</surname> <given-names>S. A.</given-names></name></person-group> (<year>2015</year>). <article-title>The technology and biology of single-cell RNA sequencing.</article-title> <source><italic>Mol. Cell</italic></source> <volume>58</volume> <fpage>610</fpage>&#x2013;<lpage>620</lpage>.</citation></ref>
<ref id="B28"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Laks</surname> <given-names>E.</given-names></name> <name><surname>McPherson</surname> <given-names>A.</given-names></name> <name><surname>Zahn</surname> <given-names>H.</given-names></name> <name><surname>Lai</surname> <given-names>D.</given-names></name> <name><surname>Steif</surname> <given-names>A.</given-names></name> <name><surname>Brimhall</surname> <given-names>J.</given-names></name><etal/></person-group> (<year>2019</year>). <article-title>Clonal decomposition and DNA replication states defined by scaled single-cell genome sequencing.</article-title> <source><italic>Cell</italic></source> <volume>179</volume> <fpage>1207</fpage>&#x2013;<lpage>1221</lpage>.</citation></ref>
<ref id="B29"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lam</surname> <given-names>M. T. Y.</given-names></name> <name><surname>Li</surname> <given-names>W.</given-names></name> <name><surname>Rosenfeld</surname> <given-names>M. G.</given-names></name> <name><surname>Glass</surname> <given-names>C. K.</given-names></name></person-group> (<year>2014</year>). <article-title>Enhancer RNAs and regulated transcriptional programs.</article-title> <source><italic>Trends Biochem. Sci.</italic></source> <volume>39</volume> <fpage>170</fpage>&#x2013;<lpage>182</lpage>. <pub-id pub-id-type="doi">10.1016/j.tibs.2014.02.007</pub-id> <pub-id pub-id-type="pmid">24674738</pub-id></citation></ref>
<ref id="B30"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Liyanage</surname> <given-names>C.</given-names></name> <name><surname>Fernando</surname> <given-names>A.</given-names></name> <name><surname>Batra</surname> <given-names>J.</given-names></name></person-group> (<year>2019</year>). <article-title>Differential roles of protease isoforms in the tumor microenvironment.</article-title> <source><italic>Cancer Metast. Rev.</italic></source> <volume>38</volume> <fpage>389</fpage>&#x2013;<lpage>415</lpage>.</citation></ref>
<ref id="B31"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lun</surname> <given-names>A. T.</given-names></name> <name><surname>Bach</surname> <given-names>K.</given-names></name> <name><surname>Marioni</surname> <given-names>J. C.</given-names></name></person-group> (<year>2016</year>). <article-title>Pooling across cells to normalize single-cell RNA sequencing data with many zero counts.</article-title> <source><italic>Genome Biol.</italic></source> <volume>17</volume>:<fpage>75</fpage>.</citation></ref>
<ref id="B32"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lun</surname> <given-names>A. T. L.</given-names></name> <name><surname>McCarthy</surname> <given-names>D. J.</given-names></name> <name><surname>Marioni</surname> <given-names>J. C.</given-names></name></person-group> (<year>2016</year>). <article-title>A step-by-step workflow for low-level analysis of single-cell RNA-seq data with Bioconductor.</article-title> <source><italic>F1000Research</italic></source> <volume>5</volume>:<fpage>2122</fpage>.</citation></ref>
<ref id="B33"><citation citation-type="journal"><person-group person-group-type="author"><collab>MAQC Consortium</collab> <name><surname>Shi</surname> <given-names>L.</given-names></name> <name><surname>Reid</surname> <given-names>L. H.</given-names></name> <name><surname>Jones</surname> <given-names>W. D.</given-names></name> <name><surname>Shippy</surname> <given-names>R.</given-names></name> <name><surname>Warrington</surname> <given-names>J. A.</given-names></name><etal/></person-group> (<year>2006</year>). <article-title>The MicroArray quality control (MAQC) project shows inter- and intraplatform reproducibility of gene expression measurements.</article-title> <source><italic>Nat. Biotechnol.</italic></source> <volume>24</volume> <fpage>1151</fpage>&#x2013;<lpage>1161</lpage>.</citation></ref>
<ref id="B34"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Marzluff</surname> <given-names>W. F.</given-names></name> <name><surname>Wagner</surname> <given-names>E. J.</given-names></name> <name><surname>Duronio</surname> <given-names>R. J.</given-names></name></person-group> (<year>2008</year>). <article-title>Metabolism and regulation of canonical histone mRNAs: life without a poly(A) tail.</article-title> <source><italic>Nat. Rev. Genet.</italic></source> <volume>9</volume> <fpage>843</fpage>&#x2013;<lpage>854</lpage>.</citation></ref>
<ref id="B35"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mills</surname> <given-names>J. D.</given-names></name> <name><surname>Kawahara</surname> <given-names>Y.</given-names></name> <name><surname>Janitz</surname> <given-names>M.</given-names></name></person-group> (<year>2013</year>). <article-title>Strand-specific RNA-Seq provides greater resolution of transcriptome profiling.</article-title> <source><italic>Curr. Genom.</italic></source> <volume>14</volume> <fpage>173</fpage>&#x2013;<lpage>181</lpage>. <pub-id pub-id-type="doi">10.2174/1389202911314030003</pub-id> <pub-id pub-id-type="pmid">24179440</pub-id></citation></ref>
<ref id="B36"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Moretta</surname> <given-names>A.</given-names></name> <name><surname>Bottino</surname> <given-names>C.</given-names></name> <name><surname>Vitale</surname> <given-names>M.</given-names></name> <name><surname>Pende</surname> <given-names>D.</given-names></name> <name><surname>Cantoni</surname> <given-names>C.</given-names></name> <name><surname>Mingari</surname> <given-names>M. C.</given-names></name><etal/></person-group> (<year>2001</year>). <article-title>Activating receptors and coreceptors involved in human natural killer cell-mediated cytolysis.</article-title> <source><italic>Annu. Rev. Immunol.</italic></source> <volume>19</volume> <fpage>197</fpage>&#x2013;<lpage>223</lpage>. <pub-id pub-id-type="doi">10.1146/annurev.immunol.19.1.197</pub-id> <pub-id pub-id-type="pmid">11244035</pub-id></citation></ref>
<ref id="B37"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Newman</surname> <given-names>A. M.</given-names></name> <name><surname>Liu</surname> <given-names>C. L.</given-names></name> <name><surname>Green</surname> <given-names>M. R.</given-names></name> <name><surname>Gentles</surname> <given-names>A. J.</given-names></name> <name><surname>Feng</surname> <given-names>W.</given-names></name> <name><surname>Xu</surname> <given-names>Y.</given-names></name><etal/></person-group> (<year>2015</year>). <article-title>Robust enumeration of cell subsets from tissue expression profiles.</article-title> <source><italic>Nat. Methods</italic></source> <volume>12</volume> <fpage>453</fpage>&#x2013;<lpage>457</lpage>.</citation></ref>
<ref id="B38"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Nip</surname> <given-names>K. M.</given-names></name> <name><surname>Chiu</surname> <given-names>R.</given-names></name> <name><surname>Yang</surname> <given-names>C.</given-names></name> <name><surname>Chu</surname> <given-names>J.</given-names></name> <name><surname>Mohamadi</surname> <given-names>H.</given-names></name> <name><surname>Warren</surname> <given-names>R. L.</given-names></name><etal/></person-group> (<year>2019</year>). <article-title>RNA-Bloom provides lightweight reference-free transcriptome assembly for single cells.</article-title> <source><italic>bioRxiv</italic></source> [Preprint]. <pub-id pub-id-type="doi">10.1101/701607</pub-id></citation></ref>
<ref id="B39"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pertea</surname> <given-names>M.</given-names></name> <name><surname>Pertea</surname> <given-names>G. M.</given-names></name> <name><surname>Antonescu</surname> <given-names>C. M.</given-names></name> <name><surname>Chang</surname> <given-names>T. C.</given-names></name> <name><surname>Mendell</surname> <given-names>J. T.</given-names></name> <name><surname>Salzberg</surname> <given-names>S. L.</given-names></name></person-group> (<year>2015</year>). <article-title>StringTie enables improved reconstruction of a transcriptome from RNA-seq reads.</article-title> <source><italic>Nat. Biotechnol.</italic></source> <volume>33</volume> <fpage>290</fpage>&#x2013;<lpage>295</lpage>.</citation></ref>
<ref id="B40"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Picelli</surname> <given-names>S.</given-names></name> <name><surname>Bj&#x00F6;rklund</surname> <given-names>&#x00C5;. K.</given-names></name> <name><surname>Faridani</surname> <given-names>O. R.</given-names></name> <name><surname>Sagasser</surname> <given-names>S.</given-names></name> <name><surname>Winberg</surname> <given-names>G.</given-names></name> <name><surname>Sandberg</surname> <given-names>R.</given-names></name></person-group> (<year>2013</year>). <article-title>Smart-seq2 for sensitive full-length transcriptome profiling in single cells.</article-title> <source><italic>Nat. Methods</italic></source> <volume>10</volume> <fpage>1096</fpage>&#x2013;<lpage>1098</lpage>.</citation></ref>
<ref id="B41"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Polyak</surname> <given-names>M. J.</given-names></name> <name><surname>Li</surname> <given-names>H.</given-names></name> <name><surname>Shariat</surname> <given-names>N.</given-names></name> <name><surname>Deans</surname> <given-names>J. P.</given-names></name></person-group> (<year>2008</year>). <article-title>CD20 homo-oligomers physically associate with the B cell antigen receptor. Dissociation upon receptor engagement and recruitment of phosphoproteins and calmodulin-binding proteins.</article-title> <source><italic>J. Biol. Chem.</italic></source> <volume>283</volume> <fpage>18545</fpage>&#x2013;<lpage>18552</lpage>.</citation></ref>
<ref id="B42"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ravasi</surname> <given-names>T.</given-names></name> <name><surname>Suzuki</surname> <given-names>H.</given-names></name> <name><surname>Pang</surname> <given-names>K. C.</given-names></name> <name><surname>Katayama</surname> <given-names>S.</given-names></name> <name><surname>Furuno</surname> <given-names>M.</given-names></name> <name><surname>Okunishi</surname> <given-names>R.</given-names></name><etal/></person-group> (<year>2006</year>). <article-title>Experimental validation of the regulated expression of large numbers of non-coding RNAs from the mouse genome.</article-title> <source><italic>Genome Res.</italic></source> <volume>16</volume> <fpage>11</fpage>&#x2013;<lpage>19</lpage>.</citation></ref>
<ref id="B43"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Reid</surname> <given-names>A. J.</given-names></name> <name><surname>Talman</surname> <given-names>A. M.</given-names></name> <name><surname>Bennett</surname> <given-names>H. M.</given-names></name> <name><surname>Gomes</surname> <given-names>A. R.</given-names></name> <name><surname>Sanders</surname> <given-names>M. J.</given-names></name> <name><surname>Illingworth</surname> <given-names>C. J. R.</given-names></name><etal/></person-group> (<year>2018</year>). <article-title>Single-cell RNA-seq reveals hidden transcriptional variation in malaria parasites.</article-title> <source><italic>eLife</italic></source> <volume>7</volume>:<fpage>e33105</fpage>.</citation></ref>
<ref id="B44"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sakarya</surname> <given-names>O.</given-names></name> <name><surname>Breu</surname> <given-names>H.</given-names></name> <name><surname>Radovich</surname> <given-names>M.</given-names></name> <name><surname>Chen</surname> <given-names>Y.</given-names></name> <name><surname>Wang</surname> <given-names>Y. N.</given-names></name> <name><surname>Barbacioru</surname> <given-names>C.</given-names></name><etal/></person-group> (<year>2012</year>). <article-title>RNA-Seq mapping and detection of gene fusions with a suffix array algorithm.</article-title> <source><italic>PLoS Comput. Biol.</italic></source> <volume>8</volume>:<fpage>e1002464</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pcbi.1002464</pub-id> <pub-id pub-id-type="pmid">22496636</pub-id></citation></ref>
<ref id="B45"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Scialdone</surname> <given-names>A.</given-names></name> <name><surname>Tanaka</surname> <given-names>Y.</given-names></name> <name><surname>Jawaid</surname> <given-names>W.</given-names></name> <name><surname>Moignard</surname> <given-names>V.</given-names></name> <name><surname>Wilson</surname> <given-names>N. K.</given-names></name> <name><surname>Macaulay</surname> <given-names>I. C.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>Resolving early mesoderm diversification through single-cell expression profiling.</article-title> <source><italic>Nature</italic></source> <volume>535</volume> <fpage>289</fpage>&#x2013;<lpage>293</lpage>.</citation></ref>
<ref id="B46"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sigurgeirsson</surname> <given-names>B.</given-names></name> <name><surname>Emanuelsson</surname> <given-names>O.</given-names></name> <name><surname>Lundeberg</surname> <given-names>J.</given-names></name></person-group> (<year>2014</year>). <article-title>Analysis of stranded information using an automated procedure for strand specific RNA sequencing.</article-title> <source><italic>BMC Genom.</italic></source> <volume>15</volume>:<fpage>631</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2164-15-631</pub-id> <pub-id pub-id-type="pmid">25070246</pub-id></citation></ref>
<ref id="B47"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sonoda</surname> <given-names>Y.</given-names></name> <name><surname>Ozawa</surname> <given-names>T.</given-names></name> <name><surname>Hirose</surname> <given-names>Y.</given-names></name> <name><surname>Aldape</surname> <given-names>K. D.</given-names></name> <name><surname>McMahon</surname> <given-names>M.</given-names></name> <name><surname>Berger</surname> <given-names>M. S.</given-names></name><etal/></person-group> (<year>2001</year>). <article-title>Formation of intracranial tumors by genetically modified human astrocytes defines four pathways critical in the development of human anaplastic astrocytoma.</article-title> <source><italic>Cancer Res.</italic></source> <volume>61</volume> <fpage>4956</fpage>&#x2013;<lpage>4960</lpage>.</citation></ref>
<ref id="B48"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Svensson</surname> <given-names>V.</given-names></name> <name><surname>Natarajan</surname> <given-names>K. N.</given-names></name> <name><surname>Ly</surname> <given-names>L. H.</given-names></name> <name><surname>Miragaia</surname> <given-names>R. J.</given-names></name> <name><surname>Labalette</surname> <given-names>C.</given-names></name> <name><surname>Macaulay</surname> <given-names>I. C.</given-names></name><etal/></person-group> (<year>2017</year>). <article-title>Power analysis of single-cell RNA-sequencing experiments.</article-title> <source><italic>Nat. Methods</italic></source> <volume>14</volume> <fpage>381</fpage>&#x2013;<lpage>387</lpage>. <pub-id pub-id-type="doi">10.1038/nmeth.4220</pub-id> <pub-id pub-id-type="pmid">28263961</pub-id></citation></ref>
<ref id="B49"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tang</surname> <given-names>F.</given-names></name> <name><surname>Barbacioru</surname> <given-names>C.</given-names></name> <name><surname>Wang</surname> <given-names>Y.</given-names></name> <name><surname>Nordman</surname> <given-names>E.</given-names></name> <name><surname>Lee</surname> <given-names>C.</given-names></name> <name><surname>Xu</surname> <given-names>N.</given-names></name><etal/></person-group> (<year>2009</year>). <article-title>mRNA-Seq whole-transcriptome analysis of a single cell.</article-title> <source><italic>Nat. Methods</italic></source> <volume>6</volume> <fpage>377</fpage>&#x2013;<lpage>382</lpage>.</citation></ref>
<ref id="B50"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tarasov</surname> <given-names>A.</given-names></name> <name><surname>Vilella</surname> <given-names>A. J.</given-names></name> <name><surname>Cuppen</surname> <given-names>E.</given-names></name> <name><surname>Nijman</surname> <given-names>I. J.</given-names></name> <name><surname>Prins</surname> <given-names>P.</given-names></name></person-group> (<year>2015</year>). <article-title>Sambamba: fast processing of NGS alignment formats.</article-title> <source><italic>Bioinformatics</italic></source> <volume>31</volume> <fpage>2032</fpage>&#x2013;<lpage>2034</lpage>.</citation></ref>
<ref id="B51"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tirosh</surname> <given-names>I.</given-names></name> <name><surname>Izar</surname> <given-names>B.</given-names></name> <name><surname>Prakadan</surname> <given-names>S. M.</given-names></name> <name><surname>Wadsworth</surname> <given-names>M. H.</given-names></name> <name><surname>Treacy</surname> <given-names>D.</given-names></name> <name><surname>Trombetta</surname> <given-names>J. J.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>Dissecting the multicellular ecosystem of metastatic melanoma by single-cell RNA-seq.</article-title> <source><italic>Science</italic></source> <volume>352</volume> <fpage>189</fpage>&#x2013;<lpage>196</lpage>.</citation></ref>
<ref id="B52"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Verboom</surname> <given-names>K.</given-names></name> <name><surname>Everaert</surname> <given-names>C.</given-names></name> <name><surname>Bolduc</surname> <given-names>N.</given-names></name> <name><surname>Livak</surname> <given-names>K. J.</given-names></name> <name><surname>Yigit</surname> <given-names>N.</given-names></name> <name><surname>Rombaut</surname> <given-names>D.</given-names></name><etal/></person-group> (<year>2019</year>). <article-title>SMARTer single cell total RNA sequencing.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>47</volume>:<fpage>e93</fpage>. <pub-id pub-id-type="doi">10.1093/nar/gkz535</pub-id> <pub-id pub-id-type="pmid">31216024</pub-id></citation></ref>
<ref id="B53"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yang</surname> <given-names>L.</given-names></name> <name><surname>Duff</surname> <given-names>M. O.</given-names></name> <name><surname>Graveley</surname> <given-names>B. R.</given-names></name> <name><surname>Carmichael</surname> <given-names>G. G.</given-names></name> <name><surname>Chen</surname> <given-names>L. L.</given-names></name></person-group> (<year>2011</year>). <article-title>Genome wide characterization of non-polyadenylated RNAs.</article-title> <source><italic>Genome Biol.</italic></source> <volume>12</volume>:<fpage>R16</fpage>. <pub-id pub-id-type="doi">10.1186/gb-2011-12-2-r16</pub-id> <pub-id pub-id-type="pmid">21324177</pub-id></citation></ref>
<ref id="B54"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname> <given-names>J.</given-names></name> <name><surname>Chen</surname> <given-names>S.</given-names></name> <name><surname>Yang</surname> <given-names>J.</given-names></name> <name><surname>Zhao</surname> <given-names>F.</given-names></name></person-group> (<year>2020</year>). <article-title>Accurate quantification of circular RNAs identifies extensive circular isoform switching events.</article-title> <source><italic>Nat. Commun.</italic></source> <volume>11</volume>:<fpage>90</fpage>.</citation></ref>
<ref id="B55"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhao</surname> <given-names>S.</given-names></name> <name><surname>Zhang</surname> <given-names>Y.</given-names></name> <name><surname>Gordon</surname> <given-names>W.</given-names></name> <name><surname>Quan</surname> <given-names>J.</given-names></name> <name><surname>Xi</surname> <given-names>H.</given-names></name> <name><surname>Du</surname> <given-names>S.</given-names></name><etal/></person-group> (<year>2015</year>). <article-title>Comparison of stranded and non-stranded RNA-seq transcriptome profiling and investigation of gene overlap.</article-title> <source><italic>BMC Genom.</italic></source> <volume>16</volume>:<fpage>675</fpage>. <pub-id pub-id-type="doi">10.1186/s12864-015-1876-7</pub-id> <pub-id pub-id-type="pmid">26334759</pub-id></citation></ref>
<ref id="B56"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ziegenhain</surname> <given-names>C.</given-names></name> <name><surname>Vieth</surname> <given-names>B.</given-names></name> <name><surname>Parekh</surname> <given-names>S.</given-names></name> <name><surname>Reinius</surname> <given-names>B.</given-names></name> <name><surname>Guillaumet-Adkins</surname> <given-names>A.</given-names></name> <name><surname>Smets</surname> <given-names>M.</given-names></name><etal/></person-group> (<year>2017</year>). <article-title>Comparative analysis of single-cell RNA sequencing methods.</article-title> <source><italic>Mol. Cell</italic></source> <volume>65</volume> <fpage>631</fpage>&#x2013;<lpage>643</lpage>.</citation></ref>
<ref id="B57"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ziegler-Heitbrock</surname> <given-names>L.</given-names></name> <name><surname>Ancuta</surname> <given-names>P.</given-names></name> <name><surname>Crowe</surname> <given-names>S.</given-names></name> <name><surname>Dalod</surname> <given-names>M.</given-names></name> <name><surname>Grau</surname> <given-names>V.</given-names></name> <name><surname>Hart</surname> <given-names>D. N.</given-names></name><etal/></person-group> (<year>2010</year>). <article-title>Nomenclature of monocytes and dendritic cells in blood.</article-title> <source><italic>Blood</italic></source> <volume>116</volume> <fpage>e74</fpage>&#x2013;<lpage>e80</lpage>.</citation></ref>
</ref-list><fn-group>
<fn id="footnote1">
<label>1</label>
<p><ext-link ext-link-type="uri" xlink:href="https://support.10xgenomics.com/single-cell-gene-expression/datasets/3.0.0/pbmc_1k_v3">https://support.10xgenomics.com/single-cell-gene-expression/datasets/3.0.0/pbmc_1k_v3</ext-link></p></fn>
<fn id="footnote2">
<label>2</label>
<p><ext-link ext-link-type="uri" xlink:href="http://cf.10xgenomics.com/supp/cell-exp/refdata-cellranger-hg19-3.0.0.tar.gz">http://cf.10xgenomics.com/supp/cell-exp/refdata-cellranger-hg19-3.0.0.tar.gz</ext-link></p></fn>
<fn id="footnote3">
<label>3</label>
<p><ext-link ext-link-type="uri" xlink:href="https://sourceforge.net/projects/brie-rna/files/annotation/">https://sourceforge.net/projects/brie-rna/files/annotation/</ext-link></p></fn>
<fn id="footnote4">
<label>4</label>
<p><ext-link ext-link-type="uri" xlink:href="https://github.com/huangyh09/briekit">https://github.com/huangyh09/briekit</ext-link></p></fn>
<fn id="footnote5">
<label>5</label>
<p><ext-link ext-link-type="uri" xlink:href="https://github.com/lh3/seqtk">https://github.com/lh3/seqtk</ext-link></p></fn>
<fn id="footnote6">
<label>6</label>
<p><ext-link ext-link-type="uri" xlink:href="https://support.10xgenomics.com/single-cell-gene-expression/datasets/3.0.0/pbmc_1k_v3">https://support.10xgenomics.com/single-cell-gene-expression/datasets/3.0.0/pbmc_1k_v3</ext-link></p></fn>
</fn-group>
</back>
</article>