<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Genet.</journal-id>
<journal-title>Frontiers in Genetics</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Genet.</abbrev-journal-title>
<issn pub-type="epub">1664-8021</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">894597</article-id>
<article-id pub-id-type="doi">10.3389/fgene.2022.894597</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Genetics</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Integration of Single-Cell Transcriptomics With a High Throughput Functional Screening Assay to Resolve Cell Type, Growth Kinetics, and Stemness Heterogeneity Within the Comma-1D Cell Line</article-title>
<alt-title alt-title-type="left-running-head">Dave et al.</alt-title>
<alt-title alt-title-type="right-running-head">Single-Cell Characterization of Comma-1D Heterogeneity</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Dave</surname>
<given-names>Arpit</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1714041/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Nekritz</surname>
<given-names>Erin</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Charytonowicz</surname>
<given-names>Daniel</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Beaumont</surname>
<given-names>Michael</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Smith</surname>
<given-names>Melissa</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1765234/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Beaumont</surname>
<given-names>Kristin</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1148478/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Silva</surname>
<given-names>Jose</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Sebra</surname>
<given-names>Robert</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="aff" rid="aff5">
<sup>5</sup>
</xref>
<xref ref-type="aff" rid="aff6">
<sup>6</sup>
</xref>
<xref ref-type="aff" rid="aff7">
<sup>7</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/392997/overview"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Department of Genetics and Genomic Sciences</institution>, <institution>Icahn School of Medicine at Mount Sinai</institution>, <addr-line>New York</addr-line>, <addr-line>NY</addr-line>, <country>United States</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Department of Pathology</institution>, <institution>Icahn School of Medicine at Mount Sinai Hospital</institution>, <addr-line>New York</addr-line>, <addr-line>NY</addr-line>, <country>United States</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Icahn Genomics Institute</institution>, <institution>Icahn School of Medicine at Mount Sinai</institution>, <addr-line>New York</addr-line>, <addr-line>NY</addr-line>, <country>United States</country>
</aff>
<aff id="aff4">
<sup>4</sup>
<institution>Department of Biochemistry and Molecular Genetics</institution>, <institution>University of Louisville</institution>, <addr-line>Louisville</addr-line>, <addr-line>KY</addr-line>, <country>United States</country>
</aff>
<aff id="aff5">
<sup>5</sup>
<institution>Black Family Stem Cell Institute</institution>, <institution>Icahn School of Medicine at Mount Sinai</institution>, <addr-line>New York</addr-line>, <addr-line>NY</addr-line>, <country>United States</country>
</aff>
<aff id="aff6">
<sup>6</sup>
<institution>Center for Advanced Genomics Technology</institution>, <institution>Icahn School of Medicine at Mount Sinai</institution>, <addr-line>New York</addr-line>, <addr-line>NY</addr-line>, <country>United States</country>
</aff>
<aff id="aff7">
<sup>7</sup>
<institution>Sema4</institution>, <institution>A Mount Sinai Venture</institution>, <addr-line>Stamford</addr-line>, <addr-line>CT</addr-line>, <country>United States</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/28953/overview">H. Steven Wiley</ext-link>, Pacific Northwest National Laboratory (DOE), United States</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1044847/overview">Travis Steele Johnson</ext-link>, Indiana University Bloomington, United States</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/782868/overview">Sushmita Roy</ext-link>, University of Wisconsin-Madison, United States</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Robert Sebra, <email>Robert.sebra@mssm.edu</email>
</corresp>
<fn fn-type="other">
<p>This article was submitted to Genomic Assay Technology, a section of the journal Frontiers in Genetics</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>14</day>
<month>06</month>
<year>2022</year>
</pub-date>
<pub-date pub-type="collection">
<year>2022</year>
</pub-date>
<elocation-id>894597</elocation-id>
<history>
<date date-type="received">
<day>11</day>
<month>03</month>
<year>2022</year>
</date>
<date date-type="accepted">
<day>20</day>
<month>05</month>
<year>2022</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2022 Dave, Nekritz, Charytonowicz, Beaumont, Smith, Beaumont, Silva and Sebra.</copyright-statement>
<copyright-year>2022</copyright-year>
<copyright-holder>Dave, Nekritz, Charytonowicz, Beaumont, Smith, Beaumont, Silva and Sebra</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>Cell lines are one of the most frequently implemented model systems in life sciences research as they provide reproducible high throughput testing. Differentiation of cell cultures varies by line and, in some cases, can result in functional modifications within a population. Although research is increasingly dependent on these <italic>in vitro</italic> model systems, the heterogeneity within cell lines has not been thoroughly investigated. Here, we have leveraged high throughput single-cell assays to investigate the Comma-1D mouse cell line that is known to differentiate in culture. Using scRNASeq and custom single-cell phenotype assays, we resolve the clonal heterogeneity within the referenced cell line on the genomic and functional level. We performed a cohesive analysis of the transcriptome of 5,195 sequenced cells, of which 85.3% of the total reads successfully mapped to the mm10-3.0.0 reference genome. Across multiple gene expression analysis pipelines, both luminal and myoepithelial lineages were observed. Deep differential gene expression analysis revealed eight subclusters identified as luminal progenitor, luminal differentiated, myoepithelial differentiated, and fibroblast subpopulations&#x2014;suggesting functional clustering within each lineage. Gene expression of published mammary stem cell (MaSC) markers Epcam, Cd49f, and Sca-1 was detected across the population, with 116 (2.23%) sequenced cells expressing all three markers. To gain insight into functional heterogeneity, cells with patterned MaSC marker expression were isolated and phenotypically investigated through a custom single-cell high throughput assay. The comparison of growth kinetics demonstrates functional heterogeneity within each cell cluster while also illustrating significant limitations in current cell isolation methods. 
We outlined the upstream use of our novel automated cell identification platform&#x2014;to be used prior to single-cell culture&#x2014;for reduced cell stress and improved rare cell identification and capture. Through compounding single-cell pipelines, we better reveal the heterogeneity within Comma-1D to identify subpopulations with specific functional characteristics.</p>
</abstract>
<kwd-group>
<kwd>scRNASeq</kwd>
<kwd>Mammary Development</kwd>
<kwd>Comma-1D</kwd>
<kwd>Mouse Cell Line</kwd>
<kwd>Functional Assay</kwd>
<kwd>High throughput</kwd>
</kwd-group>
</article-meta>
</front>
<body>
<sec id="s1">
<title>Introduction</title>
<p>In most mammalian females, the mammary gland consists of branching ducts surrounded by adipose tissue. The ducts comprise three layers: basement membrane, basal cells, and luminal cells outlined in <xref ref-type="fig" rid="F1">Figure 1A</xref> (<xref ref-type="bibr" rid="B38">Malhotra et al., 2010</xref>; <xref ref-type="bibr" rid="B27">Kondov et al., 2018</xref>). The basal cell contracture assists milk transport through the ducts toward the skin surface. The luminal cells line the inside of the ducts, and the alveolar cell lineage secretes milk during pregnancy. Within normal development, the ducts branch throughout the breast, and adipose is the predominant tissue. Details of mammary gland development across developmental time points have been extensively studied (<xref ref-type="bibr" rid="B19">Hens and Wysolmerski, 2005</xref>; <xref ref-type="bibr" rid="B3">Anderson et al., 2007</xref>). Over the course of pregnancy, prolactin and progesterone trigger drastic branching and invasion of ducts along with lobuloalveolar units to maximize lactational competency. This tissue remodeling also involves environmental reorganization for supporting development, including vascularization to support growth, lipid loss in adipocytes for spatial restructuring, and enlargement of the liver for addressing increased energy needs (<xref ref-type="bibr" rid="B51">Petitti and Perlman, 1988</xref>). There is evidence highlighting the pathogenesis of breast cancer mirroring the functional pathways identified for mammary gland development during pregnancy. Mechanisms such as reduced cell apoptosis, increased cell proliferation, and extracellular matrix modification reflect alterations in oncogenesis and pregnancy (<xref ref-type="bibr" rid="B61">Slepicka et al., 2019</xref>). Therefore, model systems that can simulate properties specific to healthy mammary gland function have the potential to serve as a proxy for better understanding of breast cancer disease pathogenesis.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>Background on mammary duct biology and an introduction to the scRNASeq pipeline. <bold>(A)</bold> Model of mammary duct cross-section and potential cell types, including tumor initiation. <bold>(B)</bold> A framework of the experimental pipeline to investigate sample heterogeneity with improved resolution and throughput. The illustrations were generated on <ext-link ext-link-type="uri" xlink:href="http://Biorender.com">Biorender.com</ext-link>. <bold>(C)</bold> Violin plots for percent of genes mapping to mitochondrial genome, the total number of molecules detected within a cell, and the number of unique genes detected in each cell. Each data point represents a unique barcode from a bead. Filtered violin plots show cells with the percent of genes mapping to mitochondrial genome less than 20%, the number of unique features detected in each cell greater than 2,000, and an nCount less than 45,000. <bold>(D)</bold> Elbow plot outlining the standard deviation/variance in the data set attributed to each principal component. Kinks in the curve can highlight the distinction between relevant and noise PCs.</p>
</caption>
<graphic xlink:href="fgene-13-894597-g001.tif"/>
</fig>
<p>Characterization of breast cancer is often leveraged to classify patients into disease pathways based on surface receptor expression of Estrogen receptor (ER), Progesterone receptor (PR), and Human epidermal growth factor receptor 2 (HER2). As higher resolution assays reveal marker expression attributed to subpopulations within a tumor, the granularity of disease classifications has been modified to reflect this new information (<xref ref-type="bibr" rid="B32">Lehmann et al., 2016</xref>). Novel gene vectors within a population have also been shown to provide information on proliferative capacity, migration tendency, stemness capability, and treatment targets (<xref ref-type="bibr" rid="B21">Jiang et al., 2021</xref>; <xref ref-type="bibr" rid="B77">Xu et al., 2021</xref>). Further investigations into breast cancer have previously yielded fundamental marker discoveries including <italic>Mki67</italic>
<sup>&#x2b;</sup> as a prognostic marker, <italic>Cd44</italic>
<sup>&#x2b;</sup>/<italic>Cd24</italic>
<sup>&#x2b;</sup> as a breast cancer stem cell marker, and <italic>Trop2</italic> as another therapeutic target (<xref ref-type="bibr" rid="B57">Ricardo et al., 2011</xref>; <xref ref-type="bibr" rid="B75">Xiong et al., 2019</xref>; <xref ref-type="bibr" rid="B35">Liu et al., 2021</xref>). Gene vectors also assist cell type deconvolution and functional prediction with markers such as epithelial cell adhesion molecule (<italic>Epcam</italic>), actin alpha 2 (<italic>Acta2</italic>), and collagen type I alpha 2 chain (<italic>Col1a2</italic>) expressed significantly in luminal, myoepithelial, and fibroblast cell types, respectively (<xref ref-type="bibr" rid="B52">Prater et al., 2014</xref>; <xref ref-type="bibr" rid="B69">Visvader and Stingl, 2014</xref>; <xref ref-type="bibr" rid="B42">Muhl et al., 2020</xref>). <italic>Epcam</italic> further serves as a marker for stemness and functions in cellular migration (<xref ref-type="bibr" rid="B16">Gaiser et al., 2012</xref>). Understanding the expression patterns of functional gene vectors in model systems ultimately allows for improved stratification of study systems and informed cell line selection in legacy investigations.</p>
<p>The Comma-1D cell line was derived from BALB/c mouse mammary epithelium and is known to functionally differentiate to preneoplastic and neoplastic phenotypes <italic>in vitro</italic> (<xref ref-type="bibr" rid="B12">Danielson et al., 1984</xref>). Cell lines traditionally serve as a high throughput model system to understand normal and oncogenic characteristics. Cell line models differ in their degree of homogeneity, with commonly investigated breast cancer lines such as MCF7 indicating biological differences between labs (<xref ref-type="bibr" rid="B48">Osborne et al., 1987</xref>). We chose to characterize Comma-1D using single-cell methods to underscore this model line for its known differentiation in culture as a demonstration to highlight the efficacy and resolution of this suite of methods. Moreover, the identification of subpopulations demonstrating stem-like gene expression followed by phenotypic assays to define differentiation capacity resulted in the development of multiple robust pipelines for model generation and characterization. The differential gene expression analysis (DGEA) provided a framework to identify clusters based on transcriptomic and predicted genomic alterations. These clusters may have identifiable functional traits that can be observed and quantified. For example, cell motility is a trait of increasing interest in oncology (<xref ref-type="bibr" rid="B67">Twigger et al., 2015</xref>). With this pipeline, we can identify motile gene expression across the population through scRNASeq followed by high throughput single-cell fluorescence quantification of migratory proteins.</p>
<p>The advent of high throughput single-cell processing platforms has allowed for the deep characterization of known and novel cell subpopulations. Further, these assays have been employed to define tumor heterogeneity and investigate the tumor microenvironment across disease subtypes and locations (<xref ref-type="bibr" rid="B50">Paul et al., 2017</xref>). However, single-cell technologies have not yet been leveraged to characterize many model systems, including Comma-1D, as many cell lines have been assumed to be homogeneous and well defined based on findings from bulk sequence data. Consortiums such as The Cancer Genome Atlas provide conventional bulk RNA and DNA methylation data for cell lines, which serve as a necessary foundation for any preliminary testing using these model systems (<xref ref-type="bibr" rid="B54">Ren et al., 2018</xref>). As our understanding of the complexity of cancer evolves, the resolution of data needed to provide an accurate framework for therapy targets needs to approach a single-cell level. By determining populations of functional variability, we generate a spectrum of subclonal populations, which can be ordered by predicted role in disease progression, role in tumor population heterogeneity, and downstream effect by successful therapeutic targeting. We present here an optimized high throughput method for single-cell genomic analysis for population identification to inform downstream phenotypic and functional experimentation (<xref ref-type="fig" rid="F1">Figure 1B</xref>). This method identified four novel populations of interest and enabled an 80.4% increase in microfluidic cell cultures populated with the <italic>Epcam</italic>
<sup>
<italic>&#x2b;</italic>
</sup>
<italic>Cd49f</italic>
<sup>
<italic>high</italic>
</sup>
<italic>Sca-1</italic>
<sup>
<italic>high</italic>
</sup>, stem-like cell type.</p>
</sec>
<sec sec-type="materials|methods" id="s2">
<title>Materials and Methods</title>
<sec id="s2-1">
<title>Comma-1D Mouse Mammary Epithelial Culture</title>
<p>The Comma-1D cell line was provided by the Gregory Hannon Laboratory (Cancer Research United Kingdom, Cambridge Institute). Aliquots were thawed and then cultured in CytoOne T25 flasks (US Scientific) with culture media comprising DMEM/F-12 media (Thermo Fisher), 2% FBS (Sigma-Aldrich), 1% Pen-Strep (Gibco), 10&#xa0;&#x3bc;g/ml Insulin (Sigma-Aldrich), and 5&#xa0;ng/ml Epidermal Growth Factor (Thermo Fisher). Upon 80% confluency, the sample was passaged following the recommended subculturing protocol for adherent cells (<xref ref-type="bibr" rid="B8">Cancer Genome Atlas Research et al., 2013</xref>).</p>
</sec>
<sec id="s2-2">
<title>Single-Cell RNA Sequencing and Library Prep</title>
<p>For single-cell RNA sequencing, cells were collected at passage five and suspended in 1x PBS media at 1 &#xd7; 10<sup>6</sup> cells/ml. Cells were processed according to Chromium 3&#x27; Gene Expression V3 Kit (10X Genomics) using the manufacturer&#x2019;s guidelines followed by sequencing on an S1 NovaSeq chip (Illumina Inc.). Qubit 3 (Fisher Scientific) and 2100 Bioanalyzer (Agilent) were used for quality check of cDNA. The output BAM file from sequencing was processed through 10X Genomics Cell Ranger software v3.1.0. The resulting read count matrix was imported into R for downstream analysis with packages such as Seurat and Monocle.</p>
<p>Single-cell gene expression data resolves unique heterogeneity information not attainable from conventional bulk sequencing technologies (<xref ref-type="bibr" rid="B56">Ricardo and Phelan, 2008</xref>). To evaluate the heterogeneity in the Comma-1D cell line, we ran the cells through the pipeline and successfully generated scRNASeq data with &#x223c;50,000 2 &#xd7; 150&#xa0;bp reads per cell with 5,745 cells sequenced, generating 238&#xa0;M reads with 98% valid barcodes and 100% valid UMIs. 85.3% of the total reads mapped to the mm10-3.0.0 reference genome.</p>
</sec>
<sec id="s2-3">
<title>ScRNASeq Comma-1D Data Filtering and Analysis</title>
<p>To advance computational accuracy and remove predicted outlier data, the Seurat object representing the cells from the Comma-1D line was filtered to remove features that were not present in at least 15 cells (&#x223c;0.3% of total cell count) (<xref ref-type="bibr" rid="B81">Zheng et al., 2017</xref>). To further clean the data set, data points were filtered using three parameters: high percent mitochondrial data is indicative of cell death, therefore cells with &#x3e;20% were removed; a high total molecule count (nCount) &#x3e;45,000 is indicative of multiplets and ribosomal RNA (rRNA) in the gel emulsion (GEM) formation, and these cells were therefore removed; a low count of unique features &#x3c;2,000 is also indicative of GEMs with no cells or debris, and these cells were also removed from the dataset (<xref ref-type="bibr" rid="B62">Svensson et al., 2017</xref>; <xref ref-type="bibr" rid="B7">Butler et al., 2018</xref>; <xref ref-type="bibr" rid="B15">Freytag et al., 2018</xref>). <xref ref-type="fig" rid="F1">Figure 1C</xref> represents the data pre- and post-sub-setting for the above-mentioned quality standards, respectively, with 5,195 of the 5,745 sequenced cells passing these QC parameters. After passing the initial QC, the data was normalized to account for variability. Cell cycle scoring was done to mitigate cell cycle heterogeneity through phase scoring of G2/M and S markers, which were then regressed out (<xref ref-type="bibr" rid="B24">Kimmerling et al., 2018</xref>). PCA was conducted for dimensionality reduction to identify undefined components that constitute variability within the data, plotted in <xref ref-type="fig" rid="F1">Figure 1D</xref>. The PCA scores were used by Seurat to generate unsupervised clusters. The Seurat object with filtered and labeled data was then utilized by the Monocle pipeline for pseudo-time analysis. Data is imported into Monocle by extracting an expression matrix, cell metadata, and gene annotations from the Seurat object. 
The new cell data set is reprocessed and standardized through the preprocess_cds() function. The cell dataset is reclustered with the louvain_iter set to one, nearest neighbor k value set to 150, and a UMAP-based dimensionality reduction. Top genes from the Seurat clusters are leveraged as markers to annotate the Monocle-generated populations.</p>
</sec>
<sec id="s2-4">
<title>Integration of Comma-1D and Mouse Mammary Dataset</title>
<p>To better understand the functional populations predicted in Comma-1D, the dataset was integrated with previously published scRNASeq mouse mammary data from a C57BL/6 mouse (<xref ref-type="bibr" rid="B49">Pal et al., 2021</xref>). C57BL/6 is a widely used strain commonly utilized for developmental biology and therefore served as a good selection for comparison with Comma-1D. For functional comparison, the adult C57BL/6 mammary tissue dataset was downloaded from the GEO database (GSE164307) and integrated with the Comma-1D scRNASeq data. The dataset was imported and preprocessed with the same pipeline described for Comma-1D. Cells were filtered for identifiers with over 800 features, less than 20,000 total counts, and less than 20 percent mitochondrial gene activity. This dataset was independently normalized and scaled prior to data integration. The C57BL/6 mouse mammary dataset provided 11,997 total cells post-filtering. Harmony is a data integration algorithm that encourages cell grouping by cell type rather than dataset biased metrics by accounting for experimental variability and was used for the integration of these data (<xref ref-type="bibr" rid="B28">Korsunsky et al., 2019</xref>). As done for the Comma-1D dataset independently, the Harmony merged dataset was processed for global unsupervised clustering using FindNeighbors() and FindClusters(), with a resolution value of 0.5. Clusters were analyzed using the FindAllMarkers() function and gene markers used to identify partitioning Comma-1D were replotted for the merged dataset using feature plots.</p>
</sec>
<sec id="s2-5">
<title>Ranked Stemness Prediction Using Entropy Scoring of Comma-1D Clusters</title>
<p>To estimate the differentiation potency (i.e., stemness) of single cells, we leveraged a computationally accelerated calculation of transcriptional Shannon entropy, following work pioneered by Teschendorff and Enver (<xref ref-type="bibr" rid="B64">Teschendorff and Enver, 2017</xref>). Conceptually, differentiation of a cell involves the progressive silencing of gene pathways unrelated to its increasingly specialized function, such that the promiscuity seen in transcriptional activity decreases as a cell differentiates. Conversely, stem-like cells retain a higher degree of overall transcriptional activity across a multitude of pathways governing potential fates. This dynamic can be leveraged to estimate the degree of differentiation of a single cell, through calculating the Shannon entropy rate of a random-walk across a protein-protein interaction (PPI) network with gene expression superimposed.</p>
<p>We implemented entropy estimation using the abovementioned approach in TensorFlow 2.0 with support for GPU accelerated calculation. Prior to entropy scoring, unnormalized raw cell counts were subject to light kNN smoothing (<italic>k</italic> &#x3d; 8) to reduce technical variance in entropy scores induced by gene dropout and subsequently renormalized to 10,000 counts per cell. Entropy scoring on smoothed, depth-normalized count data was performed on a Google Cloud VM n1-highmem-16 instance running on an NVIDIA Tesla T4 GPU with 16&#xa0;GB RAM. After calculating entropy scores, unsmoothed, depth-normalized counts were used to calculate Spearman correlations for all genes with respect to entropy score. Significance values were adjusted for multiple testing using the Benjamini-Hochberg false discovery rate method. Genes with positive Spearman correlation are overexpressed in stem-like cells, while genes with negative Spearman correlation are overexpressed in differentiated cells.</p>
</sec>
<sec id="s2-6">
<title>Subpopulation Tracking and Stemness Evaluation With Beacon</title>
<p>Cells were harvested from culture at passage five and suspended in Comma-1D culture media at an ideal loading concentration of 2 &#xd7; 10<sup>6</sup>&#xa0;cells/ml. Utilizing the small volume import parameters on Beacon, 5&#xa0;&#xb5;l of media with cells were bubble imported into the microfluidic chip at 25&#xb0;C. OptoElectroPositioning (OEP) was used to identify, isolate, and pen both independent cells and clusters of cells into isolated nanopens. Cells were loaded with a voltage of 2.1&#xa0;V at 5&#xa0;&#x3bc;m/s, with a target of 1&#x2013;4 cells per pen. This import and culture method has previously been utilized for cellular characterization (<xref ref-type="bibr" rid="B5">Beaumont et al., 2022</xref>). Over multiple iterations of this importing and culture, levels of Matrigel (Corning) were optimized to allow cell adherence on the chip surface while also providing an isolated nanopen network for 3-dimensional growth. The cells are cultured on chip with DMEM/F-12 media (Thermo Fisher), 2% FBS (Sigma-Aldrich), 1% Pen-Strep (Gibco), 10&#xa0;&#x3bc;g/ml Insulin (Sigma-Aldrich), and 5&#xa0;ng/ml Epidermal Growth Factor (Thermo Fisher) at 37&#xb0;C with 5% CO<sub>2</sub>. The microfluidics on-chip allow constant perfusion of media at 0.01&#xa0;&#x3bc;l/s. Fresh media is provided to the system every 24&#xa0;h. Cells were cultured up to 10&#xa0;days post-import.</p>
<p>All nanopens and their cellular contents were imaged in 12-h and 24-h intervals comprising every imaging channel on the Beacon system (OEP, DAPI, FITC, Texas Red, and Cy5). Pseudobinning was performed with differential expression of fluorescence of antibodies EpCAM-Cy5 (Biolegend &#x23;118220), EpCAM-AF594 (Cell Signaling Technology &#x23;73195), CD49f-FITC (Biolegend &#x23;313606), and Sca-1-BV421 (Biolegend &#x23;108127). The images were then collated and analyzed with a custom MATLAB (MathWorks) script. Images captured across timepoints and channels are aligned through the microfluidic chip&#x2019;s feature points. Each nanopen is designed with a region of interest (ROI) for coordinate-based image comparison between timepoints and imaging channels. Cells are identified through a circle detection algorithm that then filters possible cell locations by image intensity readings under the brightfield (OEP) channel. True positive cell locations are saved on a 3-dimensional matrix of coordinates. Each ROI and each cell location are measured for fluorescent intensity across channels at t<sub>0</sub>. These values are normalized by dividing cell location measurements by that cell&#x2019;s ROI measurement. This normalization permits multi-chip comparison and scoring. The normalized image intensity readings are clustered based on populational heterogeneity identified from single-cell sequencing data. The cell intensity readout is binned into the generated clusters allowing for high throughput post-import cellular subtype identification.</p>
</sec>
</sec>
<sec sec-type="results" id="s3">
<title>Results</title>
<sec id="s3-1">
<title>Resolving Subpopulation Heterogeneity Within Comma-1D With Single-Cell Transcriptomics</title>
<p>We generated eight unique subpopulations from unsupervised clustering of our Comma-1D cell line culture sample. Principal Component Analysis (PCA) is useful for fast and linear dimensionality reduction, however with increasingly complex data affiliated with scRNASeq, UMAP is another preferred network analysis tool that preserves the global structure, distance correlations, and continuity of cell states (<xref ref-type="bibr" rid="B74">Xiang et al., 2021</xref>). <xref ref-type="fig" rid="F2">Figure 2A</xref> shows a UMAP plot of the heterogeneity of the evident subgroups. Using the filtered, normalized, and scaled dataset, cell line clustering provided an increased resolution to gene expression and clonal population differences. Investigating differential gene expression between clusters within this dataset, we further highlight potential functional clustering. While one dataset was generated and processed for scRNASeq of the Comma-1D cell line, the throughput of 5,195 cells provides confidence in characterizing the observed heterogeneity. Datasets were generated for functional validation using Beacon data across 1,214 cells from two individual chips to demonstrate technical validity. All <italic>p</italic>-values are reported for each differentially expressed gene (DEG) analysis; however, due to the throughput of this assay and a high n count, <italic>p</italic>-values are close to 0 with values less than 2.225074e-308 reported as 0 by R. <xref ref-type="fig" rid="F2">Figure 2B</xref> and <xref ref-type="sec" rid="s9">Supplementary Figure S1</xref> are cluster trees outlining distance relationships between the generated subgroups, with <xref ref-type="sec" rid="s9">Supplementary Figure S1</xref> indicating nodal identifiers for downstream analysis and reference. This phylogenetic tree analysis averages data points across an identified subpopulation to extrapolate distance relationships between the identified clusters. 
Top differentially expressed genes driving the node splits in the population are outlined in <xref ref-type="sec" rid="s9">Supplementary Table S1</xref>. These gene vectors generate hits relevant to interpreting functional identities of these populations, such as <italic>Lcn2</italic> (<italic>p</italic> &#x3d; 0) and <italic>Col6a1</italic> (<italic>p</italic> &#x3d; 0). From the cluster tree and UMAP in <xref ref-type="fig" rid="F2">Figure 2</xref>, we visualize specific populations as more distant from the remaining cells, primarily clusters attributed to fibroblasts. To investigate the functional hallmarks of these populations, we explored all markers expressed in each cluster and sorted them by the difference of pct.1 and pct.2, which represent the percent of cells in a specific cluster expressing a gene and the percent of cells outside that cluster expressing that gene, respectively. Typically, we have identified that genes with difference values greater than 0.5 are responsible for providing the most direct representation of individual cluster states and that these genes, in most cases, parallel the most significant DEGs with regards to <italic>p</italic>-value and avg_logFC. Through sorting by this difference value, we derive gene expression sets increasingly specific to the subpopulation of interest (<xref ref-type="bibr" rid="B44">Newman et al., 2015</xref>). This analysis was run across all the generated clusters; resultant data is shown in <xref ref-type="sec" rid="s9">Supplementary Figure S2</xref>.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>Comma-1D preliminary cluster analysis. <bold>(A)</bold> The UMAP depicts unsupervised clusters across the population with a resolution parameter of 0.5. <bold>(B)</bold> Cluster tree generated by averaging data points across a cluster and deriving distance relationships between the identified populations on a pseudo-bulk level. <bold>(C)</bold> The heatmap outlines the expression of the top five DEGs within each cluster if they pass the significance threshold.</p>
</caption>
<graphic xlink:href="fgene-13-894597-g002.tif"/>
</fig>
<p>The top five differentially expressed genes per cluster that pass a baseline significance criterion are shown on the heatmap in <xref ref-type="fig" rid="F2">Figure 2C</xref>. These top differentially expressed genes were parsed to identify the potential cell types as labeled. The top five genes in the cluster predicted as fibroblast are <italic>Col6a1</italic> (<italic>p</italic> &#x3d; 0), <italic>Col3a1</italic> (<italic>p</italic> &#x3d; 0), <italic>Col6a2</italic> (<italic>p</italic> &#x3d; 0), <italic>Gng11</italic> (<italic>p</italic> &#x3d; 0), and <italic>Pdgfrb</italic> (<italic>p</italic> &#x3d; 0). These genes highlight invasion in the Comma-1D population as part of the diversity of collagen genes typical of fibroblast cells (<xref ref-type="bibr" rid="B47">Olsen et al., 1989</xref>). Previous studies have also found fibroblasts in Comma-1D cell line culture (<xref ref-type="bibr" rid="B12">Danielson et al., 1984</xref>). Further evidence supporting the presence of a fibroblast population in Comma-1D is highlighted in <xref ref-type="fig" rid="F3">Figure 3A</xref> by the feature plots generated across typical canonical markers of fibroblastic cells. The fibroblast cluster is significant in its isolated expression of <italic>Col3a1</italic> (<italic>p</italic> &#x3d; 0), while also expressing <italic>Vimentin</italic> (<italic>Vim</italic>, <italic>p</italic> &#x3d; 1.34e-154), <italic>S100a4</italic> (<italic>p</italic> &#x3d; 3.06e-164), and <italic>Col1a2</italic> (<italic>p</italic> &#x3d; 0) at a higher intensity than the remaining populations. Violin plots shown in <xref ref-type="fig" rid="F3">Figure 3B</xref> quantify the observed differential expression amongst the genes highlighted above.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>Predicting cell types and functions by cluster. <bold>(A)</bold> Feature plots of key canonical markers of fibroblastic cells. <bold>(B)</bold> Violin plots of key canonical markers of fibroblastic cells. Identified fibroblast cluster exclusively expressed all markers. <bold>(C)</bold> Feature plots depicting expression of markers derivative of luminal and myoepithelial subtypes, EPCAM and ACTA2, respectively. <bold>(D)</bold> Violin plots outlining distinct Krt18 expression within the luminal subtypes indicating possible alveolar cell function. Krt8 expression was significantly isolated to the predicted luminal progenitor population within the luminal subtype. Almost exclusive expression of Krt8 indicates luminal progenitor cluster as a progenitor population within luminal cells and with luminal 1 as slightly differentiated cells with secretory/alveolar function. <bold>(E)</bold> Differential genes between the two clusters in the luminal partition. <bold>(F)</bold> Differential genes within the local myoepithelial partition. <bold>(G)</bold> Ridge plot of gene markers conserved within luminal cells, but not expressed significantly outside the luminal population. <bold>(H)</bold> Ridge plot of gene markers conserved within myoepithelial cells, but not expressed significantly outside the myoepithelial population.</p>
</caption>
<graphic xlink:href="fgene-13-894597-g003.tif"/>
</fig>
<p>This pipeline was applied in parallel to the additional clusters identified in the Comma-1D culture. Through these analyses, we identified the remaining functional groups composing the Comma-1D culture population. <xref ref-type="bibr" rid="B67">Twigger et al. (2015)</xref> identified key gene markers that functionally determine mammary gland cell populations, including two main types of epithelial cells, determined to be luminal and myoepithelial cells. <xref ref-type="fig" rid="F3">Figure 3C</xref> shows increased gene expression of <italic>Epcam</italic> (<italic>p</italic> &#x3d; 0) and <italic>Acta2</italic> (<italic>p</italic> &#x3d; 0) used to identify luminal and myoepithelial populations, respectively. Diving deeper into each predicted partition, within the luminal subgroup, we observed a higher-than-expected expression of <italic>Krt18</italic> (<italic>p</italic> &#x3d; 1.57e-79), a marker for the alveolar subtype of luminal mammary cells <xref ref-type="fig" rid="F3">Figure 3D</xref> (<xref ref-type="bibr" rid="B41">Moritani et al., 2015</xref>; <xref ref-type="bibr" rid="B80">Zhao et al., 2010</xref>). Much like <xref ref-type="bibr" rid="B80">Zhao et al. (2010)</xref> noted in their immortalized mammary stem/progenitor cells, we see the expression of <italic>Krt8</italic> (<italic>p</italic> &#x3d; 0) isolated to the luminal progenitor cells relative to all other cell populations, shown in <xref ref-type="fig" rid="F3">Figure 3D</xref> (<xref ref-type="bibr" rid="B34">Lichtner et al., 1991</xref>). After running a FindMarkers() function, we generate genes differentially expressed between the luminal progenitor population and luminal 1 population, with the top hits sorted by pct.difference visualized by the violin plots in <xref ref-type="fig" rid="F3">Figure 3E</xref>. 
From the DEGs identified in <xref ref-type="fig" rid="F3">Figure 3E</xref>, we noticed that the <italic>Krt7</italic> (<italic>p</italic> &#x3d; 1.13e-180) and <italic>Ehf</italic> (<italic>p</italic> &#x3d; 1.78e-68) expression, known to identify immature luminal epithelial cells, was isolated to the luminal progenitor cluster (<xref ref-type="bibr" rid="B22">Jones et al., 2004</xref>; <xref ref-type="bibr" rid="B30">Kumar et al., 2018</xref>).</p>
<p>Within the breast, the luminal progenitor cells differentiate into non-secretory epithelial and alveolar cell types for lactating function (<xref ref-type="bibr" rid="B6">Booth et al., 2007</xref>). The non-secretory epithelial cells are typically identified by <italic>Krt19</italic>, for which we did not observe expression within this population in our experiments. However, we did observe <italic>Krt18</italic> expression, associated with the milk-creating alveolar subtype, in the luminal progenitor cluster, as shown previously in <xref ref-type="fig" rid="F3">Figure 3D</xref>. The violin plots in <xref ref-type="fig" rid="F3">Figure 3F</xref> identify a significant gene within each cluster compared to the local myoepithelial population. We found identifying functional differences within the myoepithelial clusters to be too assumptive based on our scRNASeq data; however, some DEGs can provide useful inferences. For example, the myoepithelial 5 population significantly expressed <italic>Aldh3a1</italic> (<italic>p</italic> &#x3d; 1.48e-157), which has been linked with increased cell proliferation and tolerance to the cytostatic and cytotoxic effects of lipidic aldehydes (<xref ref-type="bibr" rid="B43">Muzio et al., 2012</xref>). We also identified the differential genes across all the clusters within the myoepithelial cell type in the heatmap shown in <xref ref-type="sec" rid="s9">Supplementary Figure S2A</xref>. To highlight the differential expression for key markers, feature plots for a top gene per cluster are visualized in <xref ref-type="sec" rid="s9">Supplementary Figure S2B</xref>. This differential gene expression analysis can be paralleled across any two cell selections within the population.</p>
<p>Running a differential gene expression analysis between the luminal and myoepithelial partitions generates gene vectors conserved within each partition but with differential expression between the populations. <xref ref-type="table" rid="T1">Table 1</xref> lists the top genes that were differentially expressed between myoepithelial and luminal subtypes, identified by selecting the top 10 genes by the difference in the percentage of cells in each partition expressing that marker. The top three DEGs are visualized on the ridge plots in <xref ref-type="fig" rid="F3">Figure 3G</xref>, which showcases genes conserved within luminal cell types while also demonstrating a lack of expression in the myoepithelial cells, such as <italic>Epcam</italic> (<italic>p</italic> &#x3d; 0), <italic>Wfdc2</italic> (<italic>p</italic> &#x3d; 0), and <italic>Nkd2</italic> (<italic>p</italic> &#x3d; 0). Similarly, <xref ref-type="fig" rid="F3">Figure 3H</xref> represents the top three genes conserved within myoepithelial cell types with a lack of expression in the luminal cells, such as <italic>Igfbp6</italic> (<italic>p</italic> &#x3d; 0), <italic>Lrp1</italic> (<italic>p</italic> &#x3d; 0), and <italic>Fbln2</italic> (<italic>p</italic> &#x3d; 0).</p>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>Top genes differentially expressed between luminal and myoepithelial subtypes. Conserved genes in the myoepithelial and luminal partitions that are differentially expressed between the two. <italic>p</italic>-Value less than 2.23e-308 is reported as 0 by R.</p>
</caption>
<table>
<tbody>
<tr>
<td colspan="4" align="center">
<bold>Luminal conserved gene markers</bold>
</td>
</tr>
<tr>
<td align="left">
<bold>Gene</bold>
</td>
<td align="center">
<bold>Percent expression in luminal population</bold>
</td>
<td align="center">
<bold>Percent expression in myoepithelial population</bold>
</td>
<td align="center">
<bold>
<italic>p</italic>-value</bold>
</td>
</tr>
<tr>
<td align="left">Epcam</td>
<td align="center">0.917</td>
<td align="center">0.066</td>
<td align="center">0.000000e&#x2b;00</td>
</tr>
<tr>
<td align="left">Wfdc2</td>
<td align="center">0.923</td>
<td align="center">0.11</td>
<td align="center">0.000000e&#x2b;00</td>
</tr>
<tr>
<td align="left">Nkd2</td>
<td align="center">0.816</td>
<td align="center">0.061</td>
<td align="center">0.000000e&#x2b;00</td>
</tr>
<tr>
<td align="left">Krt18</td>
<td align="center">0.848</td>
<td align="center">0.11</td>
<td align="center">0.000000e&#x2b;00</td>
</tr>
<tr>
<td align="left">Lsr</td>
<td align="center">0.749</td>
<td align="center">0.021</td>
<td align="center">0.000000e&#x2b;00</td>
</tr>
<tr>
<td align="left">Cldn7</td>
<td align="center">0.733</td>
<td align="center">0.016</td>
<td align="center">0.000000e&#x2b;00</td>
</tr>
<tr>
<td align="left">Lad1</td>
<td align="center">0.789</td>
<td align="center">0.079</td>
<td align="center">0.000000e&#x2b;00</td>
</tr>
<tr>
<td align="left">Rab25</td>
<td align="center">0.671</td>
<td align="center">0.017</td>
<td align="center">0.000000e&#x2b;00</td>
</tr>
<tr>
<td align="left">Wfdc18</td>
<td align="center">0.72</td>
<td align="center">0.082</td>
<td align="center">0.000000e&#x2b;00</td>
</tr>
<tr>
<td align="left">Krt7</td>
<td align="center">0.669</td>
<td align="center">0.054</td>
<td align="center">0.000000e&#x2b;00</td>
</tr>
<tr>
<td colspan="4" align="center">
<bold>Myoepithelial conserved gene markers</bold>
</td>
</tr>
<tr>
<td align="left">
<bold>Gene</bold>
</td>
<td align="center">
<bold>Percent expression in luminal population</bold>
</td>
<td align="center">
<bold>Percent expression in myoepithelial population</bold>
</td>
<td align="center">
<bold>
<italic>p</italic>-value</bold>
</td>
</tr>
<tr>
<td align="left">Igfbp6</td>
<td align="center">0.193</td>
<td align="center">0.888</td>
<td align="center">0.000000e&#x2b;00</td>
</tr>
<tr>
<td align="left">Lrp1</td>
<td align="center">0.208</td>
<td align="center">0.885</td>
<td align="center">0.000000e&#x2b;00</td>
</tr>
<tr>
<td align="left">Fbln2</td>
<td align="center">0.223</td>
<td align="center">0.882</td>
<td align="center">0.000000e&#x2b;00</td>
</tr>
<tr>
<td align="left">Ass1</td>
<td align="center">0.246</td>
<td align="center">0.895</td>
<td align="center">0.000000e&#x2b;00</td>
</tr>
<tr>
<td align="left">Sparc</td>
<td align="center">0.371</td>
<td align="center">0.999</td>
<td align="center">0.000000e&#x2b;00</td>
</tr>
<tr>
<td align="left">Ptges</td>
<td align="center">0.157</td>
<td align="center">0.776</td>
<td align="center">0.000000e&#x2b;00</td>
</tr>
<tr>
<td align="left">Igfbp2</td>
<td align="center">0.149</td>
<td align="center">0.766</td>
<td align="center">0.000000e&#x2b;00</td>
</tr>
<tr>
<td align="left">Pdpn</td>
<td align="center">0.186</td>
<td align="center">0.802</td>
<td align="center">0.000000e&#x2b;00</td>
</tr>
<tr>
<td align="left">Emp3</td>
<td align="center">0.372</td>
<td align="center">0.985</td>
<td align="center">0.000000e&#x2b;00</td>
</tr>
<tr>
<td align="left">Ly6e</td>
<td align="center">0.364</td>
<td align="center">0.976</td>
<td align="center">0.000000e&#x2b;00</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>Each subcluster identified has unique signatures that assist in defining its local and global functionality within a heterogeneous cell line. To assist in functional predictions, top gene vectors for each subcluster, identified by significant avg_logFC value, are ported through a gseGO network analysis provided by the ClusterProfiler() package (<xref ref-type="bibr" rid="B72">Wu et al., 2021</xref>). The gene vectors are generated to compare functionality within each partition rather than global comparison, with the exception of the predicted fibroblast population. For example, the gene vector used to run the network analysis for myoepithelial 1 was generated by comparing the gene expression of that cluster to the remaining myoepithelial subclusters: myoepithelial 2, myoepithelial 3, myoepithelial 4, myoepithelial 5. These local comparisons within each partition determine differential transcripts with functional indications. All the pathway predictors and the affiliated genes for each subpopulation are visualized by the Cnet plots in <xref ref-type="sec" rid="s9">Supplementary Figure S3</xref>. For each subcluster analysis, the Cnet plots illustrate top pathway activation indicators and their respectively linked genes. The pathways identified predict functional differences in each subcluster based on known gene vectors. The myoepithelial subclusters were of interest in this analysis to parse functional granularity between clusters. Myoepithelial 1 expressed genes associated with cellular response to external stimuli, like <italic>Mt1</italic> (<italic>p</italic> &#x3d; 1.07e-100), <italic>Mt2</italic> (<italic>p</italic> &#x3d; 1.78e-179), and <italic>Bnip3</italic> (<italic>p</italic> &#x3d; 8.76e-150). The expression of <italic>Pttg1</italic> (<italic>p</italic> &#x3d; 4.95e-120) and <italic>Cdc20</italic> (<italic>p</italic> &#x3d; 1.35e-53) in myoepithelial 2 indicated pathway activation related to reproduction and cell growth. 
Myoepithelial 3 was defined by genes relating to gene ontology (GO) terms for cellular components and anatomy, like <italic>Cdk1</italic> (<italic>p</italic> &#x3d; 3.65e-49) and <italic>Zyx</italic> (<italic>p</italic> &#x3d; 8.46e-88). The top DEGs in myoepithelial 4 were associated with GO terms for response to wound healing and cell proliferation, including genes like <italic>Tpm1</italic> (<italic>p</italic> &#x3d; 2.15e-41), <italic>Fn1</italic> (<italic>p</italic> &#x3d; 4.31e-71), and <italic>Sparc</italic> (<italic>p</italic> &#x3d; 2.62e-100). The last population of myoepithelial cells, myoepithelial 5, was distinguished by the nucleus and intracellular organelle lumen pathways, including genes such as <italic>Hsph1</italic> (<italic>p</italic> &#x3d; 9.93e-22), <italic>Cbr3</italic> (<italic>p</italic> &#x3d; 4.57e-68), <italic>Ptges</italic> (<italic>p</italic> &#x3d; 1.48e-41), and <italic>Aldh2</italic> (<italic>p</italic> &#x3d; 2.78e-33). The myoepithelial 5 population pathways have high gene counts; therefore, only two pathways are visualized, whereas the top three are shown in the other plots. Luminal 1 has gene enrichment of <italic>Krt17</italic> (<italic>p</italic> &#x3d; 1.31e-164), <italic>Krtdap</italic> (<italic>p</italic> &#x3d; 3.06e-216), and <italic>Krt6a</italic> (<italic>p</italic> &#x3d; 2.70e-242) linked to pathways involved in keratinization and epidermis development. The luminal progenitor population has pathway activation of protease binding and endopeptidase inhibition, indicated by the expression of genes such as <italic>Wfdc18</italic> (<italic>p</italic> &#x3d; 0) and <italic>Lcn2</italic> (<italic>p</italic> &#x3d; 0). 
The fibroblast population has activation of genes related to extracellular matrix (ECM) and external structure activation through gene expression of <italic>Col1a1</italic> (<italic>p</italic> &#x3d; 0), <italic>Col1a2</italic> (<italic>p</italic> &#x3d; 0), <italic>Col3a1</italic> (<italic>p</italic> &#x3d; 0), and <italic>Col6a1</italic> (<italic>p</italic> &#x3d; 0). The significance of expression is lower among the myoepithelial comparisons further indicating that the population has reduced functional heterogeneity in comparison to the two luminal clusters.</p>
</sec>
<sec id="s3-2">
<title>Subpopulation Comparison of Integrated C57BL/6 Mouse Mammary and Comma-1D Data</title>
<p>Harmony was used to compare populations between cell line and mouse mammary tissue. The merged dataset was re-normalized to reduce experimental and sample bias. The UMAP in <xref ref-type="sec" rid="s9">Supplementary Figure S4A</xref> illustrates the relationship proximity between sample types. The merged dataset was processed for unsupervised clustering, which yielded ten unique subpopulations composing the luminal, myoepithelial, and fibroblast partitions shown in <xref ref-type="sec" rid="s9">Supplementary Figure S4A</xref>. The bar plot in <xref ref-type="sec" rid="s9">Supplementary Figure S4B</xref> quantifies sample contribution to each cluster. Every cluster population contains cells from both samples; however, most clusters have a preferential population to a given sample. For example, the myoepithelial 1 cluster has 1,944 total cells with 362 cells (18.62%) originating from C57BL/6 and 1,582 cells (81.38%) from Comma-1D. The populational breakdown linked with cell locations on UMAP indicates similar functional populations representative in each sample type, illustrated in <xref ref-type="sec" rid="s9">Supplementary Figure S4C</xref>. The three feature plots summarize the expression of canonical markers <italic>Col1a2</italic>, <italic>Acta2</italic>, and <italic>Epcam</italic> to identify fibroblast, myoepithelial, and luminal cell types, respectively. These partitions of cells are detected across the Comma-1D and C57BL/6 datasets. In the heatmap in <xref ref-type="sec" rid="s9">Supplementary Figure S4D</xref>, the top differential genes characterizing each cluster are visualized. The merged analysis revealed two smooth muscle cell derived myoepithelial populations, indicated by the expression of canonical markers <italic>Tagln</italic> (<italic>p</italic> &#x3d; 0) and <italic>Tpm2</italic> (<italic>p</italic> &#x3d; 0). 
One of the luminal populations indicated ductal cell functionality with the expression of markers <italic>Csn3</italic> (<italic>p</italic> &#x3d; 0) and <italic>Wfdc18</italic> (<italic>p</italic> &#x3d; 0). This ductal specific luminal population was not previously identified by the Comma-1D independent analysis.</p>
</sec>
<sec id="s3-3">
<title>Resolving Founder Populations Through Pseudo-Time Analysis</title>
<p>The Seurat package provides a comprehensive pipeline for cluster identification and differential gene expression. As single-cell data increasingly becomes a more widespread tool for advancing the efforts of onco-genomics, more analysis platforms are providing analysis tools to parse and interpret this complex landscape. For example, the Trapnell lab has generated the Monocle 3 pipeline for pseudo-time analysis across a population at a given time point (<xref ref-type="bibr" rid="B65">Trapnell et al., 2014</xref>). Using the differential gene expression across an entire population, we can use Monocle 3 to visualize predicted nodes of origin and differentiation. We see parallel functional clustering when investigating our Comma-1D cell line through both pipelines. Monocle reclustering generated 11 unique populations within Comma-1D. The clusters generated resemble the luminal, myoepithelial, and fibroblast transcriptomic profiles, identified previously using Seurat, outlined in <xref ref-type="fig" rid="F4">Figure 4A</xref>. The plot in <xref ref-type="fig" rid="F4">Figure 4B</xref> illustrates top gene markers from the Seurat clusters and their expression profiles within the Monocle generated populations. We identified gene expression of <italic>Col3a1</italic> (<italic>p</italic> &#x3d; 0), <italic>Epcam</italic> (<italic>p</italic> &#x3d; 0), and <italic>Acta2</italic> (<italic>p</italic> &#x3d; 2.37e-273), as predictive markers for fibroblast, luminal, and myoepithelial cells, respectively. As highlighted in <xref ref-type="fig" rid="F4">Figure 4B</xref>, the representative gene expression patterns were observed across the various partitions of Comma-1D. Therefore, we can conclude the populations created through Monocle are separating cell types similar to cell groups we defined through Seurat cluster analysis, providing independent and orthogonal validation of our approach. 
We can apply this association to identify functionally similar populations between the analysis pipelines. For example, <italic>Lgals7</italic> is a gene marker for luminal 1 (<italic>p</italic> &#x3d; 1.89e-109) in Seurat with differential expression in the luminal C (<italic>p</italic> &#x3d; 3.48e-12) cluster in Monocle. Similarly, <italic>Lcn2</italic> is differentially expressed in the luminal progenitor (<italic>p</italic> &#x3d; 0) cluster from Seurat with significant expression observed in luminal A (<italic>p</italic> &#x3d; 5.88e-139) in Monocle.</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>Pseudotime analysis of Comma-1D populations. <bold>(A)</bold> Monocle partitions and reclustering within the populations. Monocle clustering generated 11 total clusters composed of luminal, myoepithelial, and fibroblast populations. <bold>(B)</bold> Dotplot of the top four genes per cluster identified from the Seurat generated Comma-1D populations. Gene expression is plotted against Monocle generated clusters. <bold>(C)</bold> Feature plots illustrating expression of cancer stem cell (CSC) markers <italic>Epcam</italic>, <italic>Itga6</italic>, <italic>Ly6a</italic>, <italic>Cd44</italic>, <italic>Cd24a</italic>, and <italic>Mki67</italic>. Significant stemness related gene markers observed in the luminal A and myoepithelial A Monocle clusters. <bold>(D)</bold> Utilizing manually selected root nodes of interest, we create a trajectory predicting population evolution. Within Partition 1, luminal C is furthest along the differentiation trajectory. The fibroblast population is most progressed along the differentiation trajectory in Partition 2. <bold>(E)</bold> Ranked entropy score by Comma-1D cluster; the luminal progenitor population shows the most stem-like capability in this cell line. <bold>(F)</bold> UMAP plot overlaid with entropy score gradient for Seurat generated clusters.</p>
</caption>
<graphic xlink:href="fgene-13-894597-g004.tif"/>
</fig>
<p>Monocle pseudotime trajectories determine gene expression changes across the populations to place single cells along that defined trajectory. Top cancer stem cell (CSC) markers leveraged in Seurat are visualized on the Monocle UMAP in <xref ref-type="fig" rid="F4">Figure 4C</xref>. This reveals populations such as luminal A and myoepithelial A with high predicted stemness capacity. In contrast, luminal C and fibroblast clusters have reduced expression of these stemness markers. Using the DEGs between clusters identified in Seurat, we generated a Monocle trajectory plot for those genes to determine which nodes yield key expression differences. The identified and selected nodes are used to order and plot cells on a pseudotime trajectory shown in <xref ref-type="fig" rid="F4">Figure 4D</xref>. Based on the pseudotime trajectory results, we identify luminal A and myoepithelial A as populations early in the differentiation trajectory. These pseudotime findings support assumptions made from CSC marker expression. The trajectory analysis indicates luminal C and fibroblast populations as furthest along the differentiation trajectory within each partition. Based on parallel gene expression markers between analysis pipelines, this supervised pseudotime analysis further supports predictions from gene expression about the luminal progenitor population&#x2019;s stemness capability.</p>
<p>To validate the supervised findings from Monocle 3, we employed an unsupervised single-cell entropy scoring algorithm to estimate stemness within the Comma-1D clusters. Entropy scores have indicated a correlation to increased stemness capability (<xref ref-type="bibr" rid="B64">Teschendorff and Enver, 2017</xref>). This analysis confirmed the luminal progenitor cells have the highest mean entropy score (<xref ref-type="fig" rid="F4">Figure 4E</xref>), thereby further indicating this cluster&#x2019;s potential function as a progenitor or stem-like population within the Comma-1D cell line culture. Using this tool, we identify fibroblast cells as the population with the lowest mean entropy score. As this is the most functionally differentiated population in our dataset, the findings support both key conclusions interpreted from entropy scoring. The other six clusters represent similar entropy scores with mean scores between those generated for fibroblast and luminal progenitor clusters. <xref ref-type="fig" rid="F4">Figure 4F</xref> is the UMAP plot structure for Comma-1D overlaid with an entropy score gradient for each cell point. The plot visualizes the increased entropy within the luminal progenitor population.</p>
</sec>
<sec id="s3-4">
<title>Comparative Analysis of Novel and Known Stem-Like Markers Within Comma-1D Population</title>
<p>Recent publications have highlighted the Comma-1D line for its inclusion of populations of stem-like cells (<xref ref-type="bibr" rid="B79">Yang et al., 2017</xref>). Parsing published data for markers of stem-like cells revealed three markers of stem-like cell subpopulations, <italic>Epcam</italic>
<sup>
<italic>&#x2b;</italic>
</sup>
<italic>Cd49f</italic>
<sup>
<italic>high</italic>
</sup>
<italic>Sca-1</italic>
<sup>
<italic>high</italic>
</sup>, as well as preliminary phenotypic data supporting differentiation capability to both basal and luminal lineages (<xref ref-type="bibr" rid="B29">Krebsbach and Villa-Diaz, 2017</xref>). In addition, the expression of these markers has already been associated with disease prognosis (<xref ref-type="bibr" rid="B78">Yang et al., 2012</xref>). When searching for these markers across the cells sequenced from the Comma-1D line, we observed the differential gene expression patterns outlined in <xref ref-type="fig" rid="F5">Figure 5A</xref>. The gene equivalents for the proteins <italic>Epcam</italic>, <italic>Cd49f</italic>, and <italic>Sca-1</italic> are the gene symbols <italic>Epcam</italic>, <italic>Itga6</italic>, and <italic>Ly6a</italic>, respectively. Combinatorial expression of these three markers yields unique cell selections identified by the nomenclature elucidated in <xref ref-type="table" rid="T2">Table 2</xref>. We subset the entire Comma-1D population for cells expressing one or more genes of interest to investigate the subpopulations further. For example, to isolate a P8 subpopulation, we filtered for cells with a scaled expression for the collective gene set, <italic>Epcam</italic>
<sup>
<italic>&#x2b;</italic>
</sup>
<italic>Itga6</italic>
<sup>
<italic>high</italic>
</sup>
<italic>Ly6a</italic>
<sup>
<italic>high</italic>
</sup>, demonstrating higher than 0.3 intensity. This intensity cutoff was determined from a bimodality of expression across these genes where 0.3 was the lower bound of the higher mode, which we believe correlates to true RNA expression, which can be visually interpreted by the violin plots in <xref ref-type="sec" rid="s9">Supplementary Figure S5</xref>. Published markers <italic>Cd44</italic>, <italic>Cd24</italic>, and <italic>Mki67</italic> have each been linked with stemness potential and were plotted for comparison against <italic>Epcam</italic>, <italic>Itga6</italic>, and <italic>Ly6a</italic> expression (<xref ref-type="bibr" rid="B57">Ricardo et al., 2011</xref>; <xref ref-type="bibr" rid="B11">Cidado et al., 2016</xref>). These P8 filtered cells were plotted in the feature plots shown in <xref ref-type="fig" rid="F5">Figure 5B</xref> visualizing the stem gene markers of interest. The composition of this sub-selected dataset is outlined in the pie charts in <xref ref-type="fig" rid="F5">Figure 5C</xref>, where we observed cells from all clusters in the original population present in this predicted stem-like population, except for the fibroblast cluster.</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>Gene expression of markers identified for stemness. <bold>(A)</bold> Feature plots of <italic>Epcam</italic>, <italic>Itga6</italic>, and <italic>Ly6a</italic>, which represent the proteins <italic>Epcam</italic>, <italic>Cd49f</italic>, and <italic>Sca-1</italic>. <bold>(B)</bold> Feature plot expression of the key gene markers after filtering for cells expressing a minimal threshold of 0.3 for all markers. <bold>(C)</bold> Pie plot visualizing population broken down by cluster. Between the entire Comma-1D population and P8, there is increased occupancy of luminal 1 and myoepithelial 4 with a significant decrease of myoepithelial 2 and loss of the fibroblast cell population.</p>
</caption>
<graphic xlink:href="fgene-13-894597-g005.tif"/>
</fig>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>Subpopulations of interest by identified marker expression patterns. Overview of markers selected for stemness investigation. Four subpopulations of interest were identified by expression patterns of epithelial cellular adhesion molecule, integrin subunit alpha 6, and lymphocyte antigen 6 complex locus A.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Subset</th>
<th align="center">Epcam (Epcam)</th>
<th align="center">Itga6 (Cd49f)</th>
<th align="center">Ly6a (Sca-1)</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">P5</td>
<td align="center">&#x2212;</td>
<td align="center">High</td>
<td align="center">Low</td>
</tr>
<tr>
<td align="left">P6</td>
<td align="center">&#x2212;</td>
<td align="center">Low</td>
<td align="center">Low</td>
</tr>
<tr>
<td align="left">P7</td>
<td align="center">&#x2b;</td>
<td align="center">High</td>
<td align="center">Low</td>
</tr>
<tr>
<td align="left">P8</td>
<td align="center">&#x2b;</td>
<td align="center">High</td>
<td align="center">High</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s3-5">
<title>Custom Beacon Pipeline for Resolving Phenotypic Heterogeneity and Cell Aggregate Development</title>
<p>The data presented was collected using a microfluidic instrument that allows high throughput cellular selection and manipulation with light-induced dielectrophoresis (Berkeley Lights, Inc.). The system employs disposable microfluidic chips with 3,500 nanopens allowing for isolated cell cultures. Above the experimental chip is an integrated fluorescent microscope that operates with OEP, DAPI, FITC, Texas Red, and Cy5 channels. Using this system, experimental assays are designed to quantify variables including sample heterogeneity, response to stimulus, and cell interactions. Experimental and culture conditions need to be optimized for each sample to ensure assay robustness. Incremental adjustments of Matrigel concentration, cell import concentration, and chip surface treatment were made to improve cell adhesion, increase cell growth, and reduce processing time. Through dozens of iterations, we have identified a reproducible custom protocol, which resulted in Comma-1D cell growth to cell aggregates on the Beacon platform. <xref ref-type="fig" rid="F6">Figure 6A</xref> demonstrates the Comma-1D cell line cultured under a controlled microenvironment over a 5-day culture period. Each image represents a successive time point, captured at 24-h intervals, of a fixed subsection of 18 nanopens on the instrument&#x2019;s microfluidic chip. We observed cell-dependent growth differences between isolated cultures, resulting in the development of a method for capturing the biological differences driving cell-to-cell growth rate differences. The colored bar below pen images indicates pens with cells that either proliferated (indicated by green) or showed signs of apoptosis (indicated by red).</p>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption>
<p>Phenotypic assay overview. <bold>(A)</bold> A subsection of a Beacon chip across five time points of a culture period. The bar on the bottom indicates heterogeneity in observed growth response. Red indicates dying cells, white is no significant observed response, and green is for cells with detected proliferation. <bold>(B)</bold> The top graph is plotting the growth ratio across identified subpopulations. The bottom graph indicates growth differences depending on initial cell concentration. 5% error bars are visualized for each plot. <bold>(C)</bold> Sample pen images of various cells across imaging channels. The colored outline is to highlight expression (green) or lack thereof (red). The top row is a known P8 population imaged at three channels with expression detected for all three markers. U<sub>A</sub> and U<sub>B</sub> indicate sample images of unknown cell types with marker expression pattern resolving subtypes P8 and P5, respectively. <bold>(D)</bold> Overview of MATLAB script pipeline to identify cell populations by protein expression, automating observations described in <bold>(C)</bold>. <bold>(Di)</bold> Illustrates regions of interest (ROIs) representing each nanopen. <bold>(Dii)</bold> Shows possible cell detection locations based on circle detection. <bold>(Diii)</bold> Visualizes filtered cell detections leveraging OEP fluorescence thresholds. Fluorescence intensity above 65,535 is set as the threshold for true positive cell detection. <bold>(Div)</bold> Visualizes normalized expression scores for two cell detection locations in the TRED channel. Normalized scoring accounts for variability in background fluorescence between FOVs and between experimental chips. Readings are imported into a matrix for each detected cell for each marker and channel. <bold>(Dv)</bold> A sample readout of cell subtype based on the measured expression. Numbers &#x201c;5&#x201d; and &#x201c;7&#x201d; indicate populations P5 and P7, respectively. 
<bold>(Dvi)</bold> A scatter plot of all the detected cells plotted based on their expression of Cd49f and Epcam and the subtype they are predicted to belong to. 88.3% of FACS sorted cells pseudo-bin to the same population on-chip. Each color represents the pseudo-binned subtype for that cell, as indicated in the legend. Nanopens with multiple cells at t<sub>0</sub> are sources of noise and background fluorescence that misidentify some cells. <bold>(E)</bold> ROI images of randomly selected P8 identified cells from each imaging channel. The heatmap on the bottom compares expression across channels and cells. This functionality provides verification to the pseudo binning results, allows for clustering and threshold adjustment, and provides easy visualization for every cell subpopulation of interest.</p>
</caption>
<graphic xlink:href="fgene-13-894597-g006.tif"/>
</fig>
<p>We performed a growth analysis of both single and batches of cell subtypes from the Comma-1D population. The supervised cellular populations identified from scRNASeq (P5, P6, P7, and P8), listed above in <xref ref-type="table" rid="T2">Table 2</xref>, were translated to populations identifiable via surface marker antibody expression. The Comma-1D cell line was thawed from frozen aliquots and cultured in DME media with Fetal Bovine Serum (FBS), Pen Strep (PS), Insulin, and Epidermal Growth Factor (EGF). To isolate specific populations, fluorescence-activated cell sorting (FACS) was performed utilizing cell surface expression of markers <italic>Cd49f</italic>, <italic>Epcam</italic>, and <italic>Sca-1</italic>. These isolated cell populations were then independently imported onto the Beacon 3500 chip. Each cell is tracked by the location identifiers pinned to each nanopen, allowing for cell type-related deconvolution downstream. Tracking cell types allows characterization of heterogeneous batch culture at <italic>t</italic> &#x3d; 0 (t<sub>0</sub>) and its effects on growth response. Cell samples from the original culture dish that were not sorted through flow cytometry were also imported onto the Beacon chip for growth analysis. Cells were cultured on-chip for 4&#xa0;days with constant perfusion of Comma-1D culture media. Using the Beacon brightfield imaging mode (OEP), time-lapse images were captured every 12&#xa0;h across the 22 Fields of View (FOV) composing the 3,500 independent nanopens, 311 of which contained at least one cell and 562 total cells penned. Growth was tracked across each nanopen. Each pen with cells (t<sub>0</sub>) was given a proliferation ratio identified by dividing the final cell count (t<sub>96</sub>) by the starting cell count in the pen. We identified no significant growth differences between the P5, P6, P7, and P8 population subtypes, as shown in <xref ref-type="fig" rid="F6">Figure 6Bi</xref>. 
However, the population with the most considerable growth based on the calculated proliferation ratio was that which was not processed through the FACS pipeline. We observed a diminishing disparity between Comma-1D subtype-specific growth potential as cell counts in each nanopen at t<sub>0</sub> increase, as shown in <xref ref-type="fig" rid="F6">Figure 6Bii</xref>. Cell concentrations at t<sub>0</sub> and t<sub>96</sub> across all the cells imported in this experiment are presented in <xref ref-type="sec" rid="s9">Supplementary Table S3</xref>.</p>
<p>To improve the image analysis pipeline, a pseudo-sorting platform was engineered to address the current shortcomings witnessed above by Comma-1D cell types processed through FACS. Comma-1D cells were incubated with immunofluorescent markers for <italic>Epcam</italic>, <italic>Sca-1</italic>, and <italic>Cd49f</italic> and then split into sorted and unsorted groups. The sorted group of cells was then processed through FACS to isolate the four subpopulations, as before. On the Beacon microfluidic chip, specific nanopens were dedicated to each subpopulation in the FACS sorted groups. These sorted cells were imported into the nanopens, while also controlling for cell counts in each nanopen. To investigate batch effects on growth, nanopens were allowed up to four cells at t<sub>0</sub>. The remaining nanopens were then allocated to the Comma-1D unsorted population of cells. A total of 562 cells were penned on this microfluidic chip. Using known marker expression parameters from previous iterations, we created a database of image intensities from the sorted population across all the imaging channels on Beacon. This database was used to then identify which subtype (P5, P6, P7, or P8) the unsorted cells represented and served as a pseudo binning tool within the Beacon platform. To visualize this, <xref ref-type="fig" rid="F6">Figure 6C</xref> shows nine images from three separate nanopens. Each row represents the same nano pen at the same timepoint imaged on three fluorescent channels. Outlines were added around each nanopen; green boxes indicate the presence of fluorescence, and red outlines indicate low/no expression. In the top row of images in <xref ref-type="fig" rid="F6">Figure 6C</xref>, the known P8 subpopulation isolated through FACS expressed high levels of <italic>Epcam</italic>, <italic>Cd49f</italic>, and <italic>Sca-1</italic>. This is the expected pattern of expression from the P8 population as identified from scRNASeq data and FACS. 
In row two of the images in <xref ref-type="fig" rid="F6">Figure 6C</xref>, the unsorted cell A (U<sub>A</sub>) reflects the P8 subpopulation expression pattern by expressing all three markers at a detectable threshold. In contrast, unsorted cell B (U<sub>B</sub>) only significantly expresses <italic>CD49f</italic> and would therefore be categorized as a basal-like cell from the P5 subtype. P5 and P8 cells represent subpopulations that are likely to behave as &#x201c;stem-like&#x201d; and should therefore differentiate and self-renew.</p>
<p>This analysis facilitated pseudo sorting on Beacon and therefore eliminated the need for and the associated cellular stress from FACS. To further optimize this process, a custom MathWorks MATLAB script was developed with the workflow outlined in <xref ref-type="fig" rid="F6">Figure 6D</xref>. Beacon chips are divided into 22 distinct imaging FOVs, with all 22 FOVs composing the 3,500 nanopen chip when stitched. To develop the MATLAB script for automated cellular identification and pseudo binning, Comma-1D cells were incubated with immunofluorescent markers for <italic>Epcam</italic>, <italic>Sca-1</italic>, and <italic>Cd49f</italic>, as before. Without processing through FACS, 652 tagged cells were imported onto the chip. The target selection function on Beacon allows for controlled and reproducible image capture of each FOV in each fluorescent channel. To track cell response, a Region of Interest (ROI) is generated for each nanopen ID, as shown in <xref ref-type="fig" rid="F6">Figure 6Di</xref>. By tracking nanopens we can compare populations within those isolated pens at various timepoints and imaging channels. Following this, cell detection was conducted using a circular Hough transform to identify possible cells by circularity within each ROI or nanopen. <xref ref-type="fig" rid="F6">Figure 6Dii</xref> shows all regions detected prior to filtering. Filtering removed region centers not within a generated ROI for nanopens to remove false positives. <xref ref-type="fig" rid="F6">Figure 6Diii</xref> displays filtered cell detection for a given FOV determined by measuring peak brightness at each possible cell location. A measurement reading of 65,535 consistently filtered false positives. Using the center matrix, each detected cell was then measured for fluorescence intensity in each channel on Beacon. This measurement value was normalized by dividing by the average image intensity of all nanopen ROIs in that cell-free FOV. 
This normalization was necessary to compare fluorescence intensity between different FOVs as well as between sample chips as we observe variability in readings. <xref ref-type="fig" rid="F6">Figure 6Div</xref> shows an example of normalized intensity readings for a subsection of a FOV in the TRED channel. Running this analysis across each ROI for each imaging channel generates a matrix of expression readings for each imported cell. To improve pipeline robustness for future assays, rather than employing a definitive threshold to differentiate expression with background readings, K-means clustering was used. Applying K-means clustering to each marker expression and then sorting clusters based on expression levels for each channel and protein serves as an automated binning of cells by surface expression. These bins were then leveraged across the channels to identify combinations that paralleled P5, P6, P7, and P8 subpopulations. <xref ref-type="fig" rid="F6">Figure 6Dv</xref> shows a segment of a sample FOV with the text reflecting the unsupervised cell population each cell is predicted to belong to with a number &#x201c;5&#x201d; representing population group 5, or P5. <xref ref-type="fig" rid="F6">Figure 6Dvi</xref> shows a scatter plot based on <italic>Cd49f</italic> and <italic>Epcam</italic> expression, used to differentiate between basal-like and luminal-like cells within each colored cluster. To identify key pens of interest and increase efficiency in visualizing populations of interest, the script automated the export of images of the desired populations across channels. <xref ref-type="fig" rid="F6">Figure 6E</xref> is an example of ROI images captured for some P8 identified cells and the measured intensities are shown as a heatmap. In both experimental runs, the maximum number of cells were penned from one 5&#xa0;&#xb5;l import. Of the 311 nanopens with penned cells in the FACS sorted preliminary experiment, 46 (14.8%) contained P8 sorted cells. 
The pseudobinning experiment had 176 nanopens with cells, of which 47 (26.7%) nanopens had P8 cells identified. This corresponds to an 80.4% increase in targeted cell culture count. Utilization of this pseudobinning helped address and prevent cell loss associated with traditional FACS sorting and furthered the image analysis toolset.</p>
</sec>
</sec>
<sec sec-type="discussion" id="s4">
<title>Discussion</title>
<p>Utilizing scRNASeq data for gene expression analyses in conjunction with high throughput single-cell functional and proteomics data, we have developed a pipeline for both distinct population identification and validation. Through publicly available scRNA analysis tools, including Seurat and Monocle 3, we demonstrated the prediction of functional clusters within complex cell lines like Comma-1D. This heterogeneity highlights the need for further investigation into model systems, as well as high levels of intrinsic heterogeneity that must be considered when interpreting results, as they may confound conclusions of past and current studies.</p>
<p>The Comma-1D cell line is known to functionally differentiate in culture. It, therefore, served as a proxy to highlight the efficacy and resolution of the single-cell suite of methods discussed. Each cell type identified from the scRNASeq data lent toward a population to compare on the functional level for growth capacity. Within the eight subclusters identified from scRNASeq, there is observed partitioning of cells into luminal and myoepithelial groups. Each partition underwent deep characterization for further clarification on intra-partitional functional heterogeneity.</p>
<p>Luminal cells in the Comma-1D culture were identified as luminal progenitor and luminal differentiated cell types. These results reflect functional groups previously identified in mammary gland tissue, where (<xref ref-type="bibr" rid="B83">Cristea and Polyak, 2018</xref>) summarize luminal stem cell differentiation into luminal progenitor, ductal, or secretory alveolar cells. Through DGEA and network analysis, a luminal progenitor population and a differentiated luminal population predicted to be secretory alveolar cells were identified within Comma-1D. Significant expression of immature luminal cell markers such as <italic>Krt7</italic> and <italic>Ehf</italic> is observed in the luminal progenitor cluster; however, we observed expression of differentiated cell markers such as <italic>Krt8</italic> and <italic>Krt18</italic> in that same population. Where (<xref ref-type="bibr" rid="B84">Wang et al., 2001</xref>) identified <italic>Krt8/18</italic> as markers of mature differentiated luminal cells within the prostate, we observed these markers associated with mammary luminal progenitors. These results underscore sources of variability in regard to disease type being investigated and cell line versus tissue gene divergence.</p>
<p>The presence of secretory cells with the absence of a non-secretory cluster within our population leads us to hypothesize two potential scenarios. One scenario is the cell line doesn&#x2019;t fully differentiate into all cell types composing mammary gland function. The other hypothesis is that the non-secretory cells emerge from luminal progenitors at a later stage than alveolar cells, and at the stage of cell isolation and barcoding, the cell line had not yet reached this maturation point. The unclassified progenitor 1 cluster may represent secretory luminal cells that are differentiated and, therefore, are in later stages of the biological process needed to generate mammary gland cell types. Interestingly, the top DEGs in the progenitor 1 cluster are genes associated with keratinocytes and their role in cell-cell/cell-matrix interaction (<italic>Lgals7</italic>), structural components for hemidesmosome formation (<italic>Col17a1</italic>), and fibrous proteins for cellular support (<italic>Krt5</italic>) (<xref ref-type="bibr" rid="B1">Ali et al., 2021</xref>; <xref ref-type="bibr" rid="B20">Ho et al., 2022</xref>). Many of these functions mirror the needs of luminal cells within the mammary gland. Conserved gene expression within luminal cells not observed in the remaining population yield predictive information for patient disease prognosis or treatment. For example, <italic>Wfdc2</italic> encodes the He4 protein, which has already shown significant clinical benefit in monitoring and diagnosing ovarian cancer (<xref ref-type="bibr" rid="B71">Wei et al., 2016</xref>). Additionally, there has been a recent investigation into this marker&#x2019;s application in breast cancer and, based on <italic>Wfdc2</italic> expression isolated in myoepithelial cells, we can predict that its efficacy in determining disease prognosis is more relevant for basal carcinomas than luminal (<xref ref-type="bibr" rid="B10">Chen et al., 2019</xref>).</p>
<p>Unlike the resolved heterogeneity in the luminal population, the myoepithelial cells identified by expression of <italic>Acta2</italic> were populated by clusters labeled myoepithelial 1&#x2013;5 with limited functional granularity. The cnet plots illustrated in <xref ref-type="sec" rid="s9">Supplementary Figure S3</xref> visualize activated pathways in each population respective to the remaining cells in the same partition. Cells in myoepithelial 1 expressed <italic>Mt1</italic>, <italic>Mt2</italic>, and <italic>Bnip3</italic>, which are all directly involved in activating the cellular response to metal ions or the response to an inorganic substance (<xref ref-type="bibr" rid="B25">Koh and Lee, 2020</xref>). Metal ions such as Zinc are abundant in humans and play a role in the proliferation and differentiation of mammary epithelial cells (<xref ref-type="bibr" rid="B18">Han et al., 2020</xref>). Myoepithelial 2 cells significantly expressed <italic>Pttg1</italic> and <italic>Cdc20,</italic> both associated with reproductive processes in cellular development (<xref ref-type="bibr" rid="B45">Noll et al., 2015</xref>). Cells in myoepithelial 3 expressed unique markers such as <italic>Pmepa1</italic>, <italic>Zyx</italic>, and <italic>Cdk1</italic>. <italic>Zyx</italic> is a gene involved in actin reorganization for cell migration and EMT within the murine mammary gland (<xref ref-type="bibr" rid="B40">Mori et al., 2009</xref>). Myoepithelial 4 cells expressed genes such as <italic>Acta2</italic>, <italic>Fn1</italic>, and <italic>Sparc,</italic> which are linked to endothelial cell proliferation and wound healing pathways that have been shown to respond within the mammary gland to facilitate healthy lactation function as well as controlling inflammatory response to stress (<xref ref-type="bibr" rid="B58">Ryman et al., 2015</xref>). The gene and pathway hits for this cell population indicate its interaction with the fibroblast cells, supported by their UMAP proximity. 
Similarly established cell line model IM-2, derived from the fourth mammary glands of pregnant BALB/c mice, demonstrated epithelial-fibroblast interaction in cell culture and its role in structural formation in culture with parallel functional differentiation (<xref ref-type="bibr" rid="B53">Reichmann et al., 1989</xref>). Cells in myoepithelial 5 expressed <italic>Cstb</italic>, <italic>Ptges</italic>, and <italic>Txnrd1,</italic> which are all genes linked to pathways associated with intracellular organelle lumen. These pathways are pivotal within mammary epithelial cells for the production of cytoplasmic lipid droplets, the precursor to milk fat globules (<xref ref-type="bibr" rid="B9">Chanat et al., 2016</xref>). While these pathway indicators don&#x2019;t reveal exact functionality between the myoepithelial clusters, they generate an outline of heterogenous function within a cell line reflecting that of <italic>in-vivo</italic> cell populations. These results point toward a heterogenous myoepithelial population that shares the common function of organizing the mammary ductal network and aiding in milk transport while also retaining independent roles in the process.</p>
<p>Genes conserved in the myoepithelial clusters and lacking significant expression outside that partition provide markers for cell sorting and legacy experimentation. For example, <italic>Lrp1</italic>, which encodes cell surface proteins, provides a gateway to phenotypic cell identification and subsequent sorting for further downstream analysis. With this level of increased single-cell resolution data, we identified gene markers specific to clusters/subpopulations within the Comma-1D cell line (<xref ref-type="sec" rid="s9">Supplementary Table S2</xref>). While extremely important for better resolving which systems can be modeled using Comma-1D, these markers can also be applied to patient single-cell data in parsing cell type populations in the tumor microenvironment.</p>
<p>When integrating the Comma-1D dataset with mouse mammary data from C57BL/6, concordant functional clusters were detected in both populations. The presence of luminal, myoepithelial, and fibroblast cells is identified in both samples. These findings further support the functional heterogeneity in cell lines that needs to be characterized with single-cell assays. Along with the concordant populations, the C57BL/6 data also indicated the presence of populations not initially found from the Comma-1D independent analysis. With the merged data, a ductal luminal population composed of 2,466 cells was identified, with only 102 (4.14%) of those cells originating from Comma-1D. This population is characterized by markers such as <italic>Csn3</italic> and <italic>Wfdc18</italic> (<xref ref-type="sec" rid="s9">Supplementary Figure S4D</xref>). <italic>Csn3</italic> plays a role in stabilizing milk micelles, a key component of milk production during lactation (<xref ref-type="bibr" rid="B26">Komori et al., 2013</xref>). Both markers have been linked to ductal luminal cells that give rise to secretory alveolar cells (<xref ref-type="bibr" rid="B17">Han et al., 2018</xref>). Through this integrated analysis, we confirmed that the functional heterogeneity observed in Comma-1D reflects populations detected in mouse mammary epithelium.</p>
<p>Orthogonal comparison of stemness markers and pseudotime analysis provides a metric for predicting clusters along with differentiation time points of the Comma-1D population. Monocle 3 was leveraged for pseudotime analysis, where we identify cellular partitioning reflective of the cell clustering from the Seurat analysis. The Comma-1D dataset was reprocessed for dimensionality reduction on Monocle, after which the differentiation trajectory was inferred, and gene expression was plotted to track changes over pseudotime. Supervised pseudotime analysis identified the luminal progenitor population as a possible origin population in one partition of the dataset. The verification of gene-based functional predictions by entropy score validates this assay as a tool for screening progenitor-like cells, particularly beneficial when investigating an uncharacterized population or dataset.</p>
<p>There have been abundant investigations into stemness markers within the mammary gland (<xref ref-type="bibr" rid="B79">Yang et al., 2017</xref>; <xref ref-type="bibr" rid="B82">Zhou et al., 2019</xref>; <xref ref-type="bibr" rid="B14">Engelsen et al., 2020</xref>). These efforts highlight potential co-expression protein combinations that may be utilized for specific stem-like cell populations isolation, including <italic>Lin</italic>
<sup>
<italic>-</italic>
</sup>
<italic>CD29</italic>
<sup>
<italic>high</italic>
</sup>
<italic>CD24</italic>
<sup>
<italic>&#x2b;</italic>
</sup>, <italic>CD44</italic>
<sup>
<italic>&#x2b;</italic>
</sup>
<italic>CD24</italic>
<sup>
<italic>-</italic>
</sup>
<italic>Lin</italic>
<sup>-</sup>, and <italic>ALDH1</italic>
<sup>
<italic>&#x2b;</italic>
</sup>
<italic>Sca-1</italic>
<sup>
<italic>High</italic>
</sup> (<xref ref-type="bibr" rid="B79">Yang et al., 2017</xref>). Despite abundant evidence for the expression of stemness markers within this cell line, there remains no established protocol to define the extent of cell differentiation. Identifying stem cells from genomic profiling is an assumptive process, but any molecular discoveries can now be phenotypically validated using custom pipelines on real-time cellular manipulation platforms such as Beacon.</p>
<p>Intersecting published stemness markers within the mammary gland with our scRNASeq dataset identified <italic>Epcam</italic>
<sup>
<italic>&#x2b;</italic>
</sup>
<italic>, Cd49f</italic> <sup>
<italic>high</italic>
</sup>
<italic>, and Sca-1</italic>
<sup>
<italic>high</italic>
</sup> as markers of interest for further investigation. All populations except the fibroblast cluster had a subset of cells, P8, expressing all markers. As we do not expect differentiated fibroblasts to play a role in stemness, this further supports the likelihood that these markers can be utilized in identifying cells that may have stem-like properties. The P8 subpopulation is of interest due to its &#x201c;stem-like&#x201d; properties, where <italic>Sca-1</italic> is a key identifier of Hematopoietic Stem Cells (HSCs) (<xref ref-type="bibr" rid="B39">Morcos et al., 2017</xref>). While the P8 population presents the most potential for stemness based on known marker expression, investigating the other populations lacking expression of one or more of the identified genes also yielded functional identification regarding differentiation and proliferation capability. Determining functional differences from just scRNASeq data is not direct; however, we can pair the inferences made from this pipeline to observe and validate phenotypic differences between cell populations. Through the linkage of high throughput single-cell data generation pipelines across multiple cellular variables, we were able to gain deeper insight into single-cell functional heterogeneity.</p>
<p>Platforms like Beacon provide a high throughput single-cell testing method to address the emerging need to further investigate and validate the predicted phenotypic variants within a population determined from assays such as scRNASeq (<xref ref-type="bibr" rid="B37">Maddaly et al., 2017</xref>; <xref ref-type="bibr" rid="B13">Duarte et al., 2018</xref>; <xref ref-type="bibr" rid="B23">Kapalczynska et al., 2018</xref>; <xref ref-type="bibr" rid="B59">Sachs et al., 2018</xref>; <xref ref-type="bibr" rid="B63">Takebe et al., 2018</xref>; <xref ref-type="bibr" rid="B76">Xu et al., 2018</xref>; <xref ref-type="bibr" rid="B73">Xia et al., 2019</xref>). The Beacon instrument contains a 3-axis platform with four nests for cell culturing in four isolated chips. An imaging cube is fixed above the nest for imaging in 4 fluorescent channels: FITC, CY5, DAPI, and TRED. Parallel to conventional organoid growth protocols, optimizing Matrigel concentration, cellular penning parameters, media conditions, and fluidics chip conditioning was required (<xref ref-type="bibr" rid="B31">Le Gac and van den Berg, 2012</xref>). While cell growth has been selectively demonstrated on this platform for Comma-1D, multidimensional variability can activate distinct cell pathways and requires iteration for each biologic model (<xref ref-type="bibr" rid="B5">Beaumont et al., 2022</xref>).</p>
<p>scRNA sequencing provides high resolution data for subpopulation identification. We used this data to predict functional subgrouping within a population to understand the sources of disease progression and metastasis. Through scRNASeq and protein-level comparisons, the 4 populations in <xref ref-type="table" rid="T2">Table 2</xref> were identified based on the expression of <italic>Epcam, Cd49f,</italic> and <italic>Sca-1</italic>. Comma-1D cells from culture were sorted using FACS for surface expression of the given markers and imported onto a Beacon chip along with unsorted Comma-1D cells from the same culture. Distributions of t<sub>0</sub> and t<sub>f</sub> counts are outlined in <xref ref-type="sec" rid="s9">Supplementary Table S3</xref> and a summary of nanopen and cell counts in this experiment is outlined in <xref ref-type="sec" rid="s9">Supplementary Table S4</xref>. We observed significant growth in the unsorted population compared to the sorted P5, P6, P7, and P8 populations. While FACS allows high throughput sorting, current sorting systems have been shown to result in cellular stress, as described above, and diluted concentrations of rare cell populations (<xref ref-type="bibr" rid="B60">Sauvat et al., 2015</xref>; <xref ref-type="bibr" rid="B36">Llufrio et al., 2018</xref>). This result may be due to either flow-based sorting neglecting key cells of interest that skew proliferation or effects on cell expression due to the sorting process that inhibited proliferation. In either case, we believe that flow sorting compounded with the microfluidic and OEP cell importing of Beacon resulted in cell stress activation that potentially inhibited cell growth on-chip. These factors become more significant when processing patient samples where cellular stress and rare cell loss are already impacted (<xref ref-type="bibr" rid="B55">Reuben et al., 2015</xref>). 
As the initial count of cells at t<sub>0</sub> increases, we observe a diminishing disparity between sorted and unsorted cell growth. This could be due to microenvironment changes that initiate cell adherence and growth from intercellular signaling. Further investigation will be performed to gain insight into defining cell subpopulations and their individual effects on the microenvironment and cell aggregate growth.</p>
<p>From the preliminary growth data described above, we observed that this cellular stress reduced cell growth during the Beacon culture period. To address this, we leveraged the imaging channels on the Beacon instrument to identify populations of interest from unsorted Comma-1D cells that were incubated with fluorescent markers of <italic>Epcam, Cd49f,</italic> and <italic>Sca-1</italic>. The three fluorescent imaging channels were paired to independent markers, and each nanopen was imaged on each channel at 12 h interval timepoints. After subtracting expression readings with baseline values determined from empty nanopen readings and normalizing measurement readings from background, we generate expression vectors for each cell in each nanopen across imaging channels. These vectors allow pseudo-binning of unidentified cells into populations of interest. Since our P8 cells of interest are rare in the population, utilizing this pseudo-sorting capability also bypassed processing steps such as centrifuging that are conventionally necessary for FACS, further reducing cell loss and improving cell viability. After numerous iterations on Beacon, we refined our import and culturing protocol resulting in reliable cell adhesion and growth from a subset of cells. The MATLAB image analysis script allowed bypassing of FACS, preventing loss of rare cells and reducing cellular stress. Similar analyses of novel cell marker expression and single-cell growth data will likely yield the highest throughput analysis of cell subtype effects on cancer malignancy potential. The built-in cell analysis platform could not be used in this study due to compromised control on time point comparisons, as well as no available sorting algorithm for penned cells. The custom method presented here can be used more generally for high throughput separation and image analysis to focus on pathologic or other cells of interest.</p>
<p>Cell lines are used across disciplines and have unknown levels of subpopulation variability, which can alter the ability to draw definitive conclusions from <italic>in vitro</italic> studies. In the case of therapeutic development, <italic>in vitro</italic> human cell lines have been key systems for predicting both efficacy and toxicity of drugs (<xref ref-type="bibr" rid="B2">Allen et al., 2005</xref>). For the Comma-1D line, which here was identified to contain two cell partitions composed of eight clusters, it is not unlikely that certain subtypes would respond differently to therapy than others. Moreover, it is a cell line with a background of known differentiation, so we may see a more drastically heterogeneous population as compared to other breast model lines (<xref ref-type="bibr" rid="B68">Vachon and Beaulieu, 1992</xref>; <xref ref-type="bibr" rid="B70">Vranic et al., 2011</xref>). As the standard of oncology treatment moves toward targeted therapies, our understanding of model systems used as the first line of testing needs to be improved through higher resolution characterization (<xref ref-type="bibr" rid="B33">Levine, 2000</xref>; <xref ref-type="bibr" rid="B66">Tripathy, 2002</xref>; <xref ref-type="bibr" rid="B4">Arruebo et al., 2011</xref>; <xref ref-type="bibr" rid="B46">Nounou et al., 2015</xref>). Further scRNA investigation paired with phenotypic observations can provide the needed level of deep insight into cell populations used for these types of critical studies.</p>
<p>We present here an assay for identifying and monitoring functional characteristics of single cells at a high throughput level. Using a custom pseudo sorting script, we identify cell subtypes across up to 3,500 pens on the Beacon platform. Each of the pens and respective cells were tracked for growth response. By utilizing the automated script, we also prevented the loss of rare cells typically observed in flow sorting and reduced cellular stress allowing for improved growth. With this process established, we laid the foundation for the application of these analyses to varied cell lines modeling a wide variety of disease states. Furthermore, we can apply this pipeline to patient samples to diminish processing times and the impact of sample handling currently applied by FACS. By reducing the time between sample collection and functional assay, we will preserve sample quality and obtain a more accurate understanding of the patient&#x2019;s disease state. Ultimately, the development of high throughput single-cell multi-data assays can resolve the contribution of various tumor microenvironment components to disease pathogenesis and tumor metastasis. This information can be leveraged for high throughput single-cell assays to quantify therapeutic response, classify differentiation heterogeneity in generated models, and validate the conclusions identified from single-cell sequencing.</p>
</sec>
</body>
<back>
<sec id="s5">
<title>Data Availability Statement</title>
<p>The datasets presented in this study can be found in online repositories. The names of the repository/repositories and accession number(s) can be found below: <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/geo/">https://www.ncbi.nlm.nih.gov/geo/</ext-link>, GSE182589.</p>
</sec>
<sec id="s6">
<title>Author Contributions</title>
<p>AD: Conceptualization, data curation, formal analysis, investigation, methodology, project administration, resources, software, validation, visualization, writing. EN: Cell culture. DC: Formal analysis. MB, MS, KB, and JS: Review and editing. RS: Conceptualization, funding acquisition, supervision, validation, writing &#x2013; review and editing.</p>
</sec>
<sec sec-type="COI-statement" id="s7">
<title>Conflict of Interest</title>
<p>RS is employed by Sema4.</p>
<p>The remaining authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s8">
<title>Publisher&#x2019;s Note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s9">
<title>Supplementary Material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fgene.2022.894597/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fgene.2022.894597/full&#x23;supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="Image3.JPEG" id="SM1" mimetype="application/JPEG" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image1.JPEG" id="SM2" mimetype="application/JPEG" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image4.JPEG" id="SM3" mimetype="application/JPEG" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image2.JPEG" id="SM4" mimetype="application/JPEG" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image5.JPEG" id="SM5" mimetype="application/JPEG" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="DataSheet1.xlsx" id="SM6" mimetype="application/xlsx" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ali</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Alhattab</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Jafar</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Alzubide</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Sharar</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Bdour</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Differential Marker Expression between Keratinocyte Stem Cells and Their Progeny Generated from a Single Colony</article-title>. <source>Int. J. Mol. Sci.</source> <volume>22</volume> (<issue>19</issue>). <pub-id pub-id-type="doi">10.3390/ijms221910810</pub-id> </citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Allen</surname>
<given-names>D. D.</given-names>
</name>
<name>
<surname>Caviedes</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Cardenas</surname>
<given-names>A. M.</given-names>
</name>
<name>
<surname>Shimahara</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Segura-Aguilar</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Caviedes</surname>
<given-names>P. A.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>Cell Lines as <italic>In Vitro</italic> Models for Drug Screening and Toxicity Studies</article-title>. <source>Drug Dev. Ind. Pharm.</source> <volume>31</volume> (<issue>8</issue>), <fpage>757</fpage>&#x2013;<lpage>768</lpage>. <pub-id pub-id-type="doi">10.1080/03639040500216246</pub-id> </citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Anderson</surname>
<given-names>S. M.</given-names>
</name>
<name>
<surname>Rudolph</surname>
<given-names>M. C.</given-names>
</name>
<name>
<surname>McManaman</surname>
<given-names>J. L.</given-names>
</name>
<name>
<surname>Neville</surname>
<given-names>M. C.</given-names>
</name>
</person-group> (<year>2007</year>). <article-title>Key Stages in Mammary Gland Development. Secretory Activation in the Mammary Gland: It&#x27;s Not Just about Milk Protein Synthesis</article-title>. <source>Breast Cancer Res.</source> <volume>9</volume> (<issue>1</issue>), <fpage>204</fpage>. <pub-id pub-id-type="doi">10.1186/bcr1653</pub-id> </citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Arruebo</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Vilaboa</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Saez-Gutierrez</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Lambea</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Tres</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Valladares</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>2011</year>). <article-title>Assessment of the Evolution of Cancer Treatment Therapies</article-title>. <source>Cancers (Basel)</source> <volume>3</volume> (<issue>3</issue>), <fpage>3279</fpage>&#x2013;<lpage>3330</lpage>. <pub-id pub-id-type="doi">10.3390/cancers3033279</pub-id> </citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Beaumont</surname>
<given-names>K. G.</given-names>
</name>
<name>
<surname>Andreou</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Ellis</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Sebra</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Multiparameter Single-Cell Characterization of Ovarian Intratumor Heterogeneity</article-title>. <source>Methods Mol. Biol.</source> <volume>2424</volume>, <fpage>135</fpage>&#x2013;<lpage>146</lpage>. <pub-id pub-id-type="doi">10.1007/978-1-0716-1956-8_8</pub-id> </citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Booth</surname>
<given-names>B. W.</given-names>
</name>
<name>
<surname>Boulanger</surname>
<given-names>C. A.</given-names>
</name>
<name>
<surname>Smith</surname>
<given-names>G. H.</given-names>
</name>
</person-group> (<year>2007</year>). <article-title>Alveolar Progenitor Cells Develop in Mouse Mammary Glands Independent of Pregnancy and Lactation</article-title>. <source>J. Cell. Physiol.</source> <volume>212</volume> (<issue>3</issue>), <fpage>729</fpage>&#x2013;<lpage>736</lpage>. <pub-id pub-id-type="doi">10.1002/jcp.21071</pub-id> </citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Butler</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Hoffman</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Smibert</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Papalexi</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Satija</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Integrating Single-Cell Transcriptomic Data across Different Conditions, Technologies, and Species</article-title>. <source>Nat. Biotechnol.</source> <volume>36</volume> (<issue>5</issue>), <fpage>411</fpage>&#x2013;<lpage>420</lpage>. <pub-id pub-id-type="doi">10.1038/nbt.4096</pub-id> </citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<collab>Cancer Genome Atlas Research Network</collab>
<name>
<surname>Weinstein</surname>
<given-names>J. N.</given-names>
</name>
<name>
<surname>Collisson</surname>
<given-names>E. A.</given-names>
</name>
<name>
<surname>Mills</surname>
<given-names>G. B.</given-names>
</name>
<name>
<surname>Shaw</surname>
<given-names>K. R.</given-names>
</name>
<name>
<surname>Ozenberger</surname>
<given-names>B. A.</given-names>
</name>
<etal/>
</person-group> (<year>2013</year>). <article-title>The Cancer Genome Atlas Pan-Cancer Analysis Project</article-title>. <source>Nat. Genet.</source> <volume>45</volume> (<issue>10</issue>), <fpage>1113</fpage>&#x2013;<lpage>1120</lpage>. <pub-id pub-id-type="doi">10.1038/ng.2764</pub-id> </citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chanat</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Le Parc</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Lahouassa</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Badaoui</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Isolation of Endoplasmic Reticulum Fractions from Mammary Epithelial Tissue</article-title>. <source>J. Mammary Gland. Biol. Neoplasia</source> <volume>21</volume> (<issue>1-2</issue>), <fpage>1</fpage>&#x2013;<lpage>8</lpage>. <pub-id pub-id-type="doi">10.1007/s10911-016-9351-x</pub-id> </citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>J.-L.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>WFDC2 Contributes to Epithelial&#x2013;mesenchymal Transition (EMT) by Activating AKT Signaling Pathway and Regulating MMP-2 Expression</article-title>. <source>Cancer Manag. Res.</source> <volume>11</volume>, <fpage>2415</fpage>&#x2013;<lpage>2424</lpage>. <pub-id pub-id-type="doi">10.2147/cmar.s192950</pub-id> </citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cidado</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Wong</surname>
<given-names>H. Y.</given-names>
</name>
<name>
<surname>Rosen</surname>
<given-names>D. M.</given-names>
</name>
<name>
<surname>Cimino-Mathews</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Garay</surname>
<given-names>J. P.</given-names>
</name>
<name>
<surname>Fessler</surname>
<given-names>A. G.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>Ki-67 Is Required for Maintenance of Cancer Stem Cells but Not Cell Proliferation</article-title>. <source>Oncotarget</source> <volume>7</volume> (<issue>5</issue>), <fpage>6281</fpage>&#x2013;<lpage>6293</lpage>. <pub-id pub-id-type="doi">10.18632/oncotarget.7057</pub-id> </citation>
</ref>
<ref id="B83">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cristea</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Polyak</surname>
<given-names>K.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Dissecting the Mammary Gland One Cell at a Time</article-title>. <source>Nat. Commun.</source> <volume>9</volume> (<issue>1</issue>), <fpage>1</fpage>&#x2013;<lpage>3</lpage>. </citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Danielson</surname>
<given-names>K. G.</given-names>
</name>
<name>
<surname>Oborn</surname>
<given-names>C. J.</given-names>
</name>
<name>
<surname>Durban</surname>
<given-names>E. M.</given-names>
</name>
<name>
<surname>Butel</surname>
<given-names>J. S.</given-names>
</name>
<name>
<surname>Medina</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>1984</year>). <article-title>Epithelial Mouse Mammary Cell Line Exhibiting Normal Morphogenesis <italic>In Vivo</italic> and Functional Differentiation <italic>In Vitro</italic>
</article-title>. <source>Proc. Natl. Acad. Sci. U.S.A.</source> <volume>81</volume> (<issue>12</issue>), <fpage>3756</fpage>&#x2013;<lpage>3760</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.81.12.3756</pub-id> </citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Duarte</surname>
<given-names>A. A.</given-names>
</name>
<name>
<surname>Gogola</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Sachs</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Barazas</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Annunziato</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>BRCA-deficient Mouse Mammary Tumor Organoids to Study Cancer-Drug Resistance</article-title>. <source>Nat. Methods</source> <volume>15</volume> (<issue>2</issue>), <fpage>134</fpage>&#x2013;<lpage>140</lpage>. <pub-id pub-id-type="doi">10.1038/nmeth.4535</pub-id> </citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Engelsen</surname>
<given-names>A. S. T.</given-names>
</name>
<name>
<surname>Wnuk-Lipinska</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Bougnaud</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Pelissier Vatter</surname>
<given-names>F. A.</given-names>
</name>
<name>
<surname>Tiron</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Villadsen</surname>
<given-names>R.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>AXL Is a Driver of Stemness in Normal Mammary Gland and Breast Cancer</article-title>. <source>iScience</source> <volume>23</volume> (<issue>11</issue>), <fpage>101649</fpage>. <pub-id pub-id-type="doi">10.1016/j.isci.2020.101649</pub-id> </citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Freytag</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Tian</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>L&#xf6;nnstedt</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Ng</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Bahlo</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Comparison of Clustering Tools in R for Medium-Sized 10x Genomics Single-Cell RNA-Sequencing Data</article-title>. <source>F1000Res</source> <volume>7</volume>, <fpage>1297</fpage>. <pub-id pub-id-type="doi">10.12688/f1000research.15809.2</pub-id> </citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gaiser</surname>
<given-names>M. R.</given-names>
</name>
<name>
<surname>L&#xe4;mmermann</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Feng</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Igyarto</surname>
<given-names>B. Z.</given-names>
</name>
<name>
<surname>Kaplan</surname>
<given-names>D. H.</given-names>
</name>
<name>
<surname>Tessarollo</surname>
<given-names>L.</given-names>
</name>
<etal/>
</person-group> (<year>2012</year>). <article-title>Cancer-associated Epithelial Cell Adhesion Molecule (EpCAM; CD326) Enables Epidermal Langerhans Cell Motility and Migration <italic>In Vivo</italic>
</article-title>. <source>Proc. Natl. Acad. Sci. U.S.A.</source> <volume>109</volume> (<issue>15</issue>), <fpage>E889</fpage>&#x2013;<lpage>E897</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1117674109</pub-id> </citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Han</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Fei</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Lai</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Mapping the Mouse Cell Atlas by Microwell-Seq</article-title>. <source>Cell.</source> <volume>173</volume> (<issue>5</issue>), <fpage>1307</fpage>. <pub-id pub-id-type="doi">10.1016/j.cell.2018.05.012</pub-id> </citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Han</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Sanford</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Simpson</surname>
<given-names>D. M.</given-names>
</name>
<name>
<surname>Dowell</surname>
<given-names>R. D.</given-names>
</name>
<name>
<surname>Palmer</surname>
<given-names>A. E.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Remodeling of Zn<sup>2&#x2b;</sup> Homeostasis upon Differentiation of Mammary Epithelial Cells</article-title>. <source>Metallomics</source> <volume>12</volume> (<issue>3</issue>), <fpage>346</fpage>&#x2013;<lpage>362</lpage>. <pub-id pub-id-type="doi">10.1039/c9mt00301k</pub-id> </citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hens</surname>
<given-names>J. R.</given-names>
</name>
<name>
<surname>Wysolmerski</surname>
<given-names>J. J.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>Key Stages of Mammary Gland Development: Molecular Mechanisms Involved in the Formation of the Embryonic Mammary Gland</article-title>. <source>Breast Cancer Res.</source> <volume>7</volume> (<issue>5</issue>), <fpage>220</fpage>&#x2013;<lpage>224</lpage>. <pub-id pub-id-type="doi">10.1186/bcr1306</pub-id> </citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ho</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Thompson</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Fisk</surname>
<given-names>J. N.</given-names>
</name>
<name>
<surname>Nebert</surname>
<given-names>D. W.</given-names>
</name>
<name>
<surname>Bruford</surname>
<given-names>E. A.</given-names>
</name>
<name>
<surname>Vasiliou</surname>
<given-names>V.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Update of the Keratin Gene Family: Evolution, Tissue-specific Expression Patterns, and Relevance to Clinical Disorders</article-title>. <source>Hum. Genomics</source> <volume>16</volume> (<issue>1</issue>), <fpage>1</fpage>. <pub-id pub-id-type="doi">10.1186/s40246-021-00374-9</pub-id> </citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jiang</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Generoso</surname>
<given-names>S. F.</given-names>
</name>
<name>
<surname>Badia</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Payer</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Carey</surname>
<given-names>L. B.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>A Conserved Expression Signature Predicts Growth Rate and Reveals Cell &#x26; Lineage-specific Differences</article-title>. <source>PLoS Comput. Biol.</source> <volume>17</volume> (<issue>11</issue>), <fpage>e1009582</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pcbi.1009582</pub-id> </citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jones</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Mackay</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Grigoriadis</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Cossu</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Reis-Filho</surname>
<given-names>J. S.</given-names>
</name>
<name>
<surname>Fulford</surname>
<given-names>L.</given-names>
</name>
<etal/>
</person-group> (<year>2004</year>). <article-title>Expression Profiling of Purified Normal Human Luminal and Myoepithelial Breast Cells: Identification of Novel Prognostic Markers for Breast Cancer</article-title>. <source>Cancer Res.</source> <volume>64</volume> (<issue>9</issue>), <fpage>3037</fpage>&#x2013;<lpage>3045</lpage>. <pub-id pub-id-type="doi">10.1158/0008-5472.can-03-2028</pub-id> </citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kapalczynska</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Kolenda</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Przybyla</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Zajaczkowska</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Teresiak</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Filas</surname>
<given-names>V.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>2D and 3D Cell Cultures - a Comparison of Different Types of Cancer Cell Cultures</article-title>. <source>Arch. Med. Sci.</source> <volume>14</volume> (<issue>4</issue>), <fpage>910</fpage>&#x2013;<lpage>919</lpage>. </citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kimmerling</surname>
<given-names>R. J.</given-names>
</name>
<name>
<surname>Prakadan</surname>
<given-names>S. M.</given-names>
</name>
<name>
<surname>Gupta</surname>
<given-names>A. J.</given-names>
</name>
<name>
<surname>Calistri</surname>
<given-names>N. L.</given-names>
</name>
<name>
<surname>Stevens</surname>
<given-names>M. M.</given-names>
</name>
<name>
<surname>Olcum</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Linking Single-Cell Measurements of Mass, Growth Rate, and Gene Expression</article-title>. <source>Genome Biol.</source> <volume>19</volume> (<issue>1</issue>), <fpage>207</fpage>. <pub-id pub-id-type="doi">10.1186/s13059-018-1576-0</pub-id> </citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Koh</surname>
<given-names>J.-Y.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>S.-J.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Metallothionein-3 as a Multifunctional Player in the Control of Cellular Processes and Diseases</article-title>. <source>Mol. Brain</source> <volume>13</volume> (<issue>1</issue>), <fpage>116</fpage>. <pub-id pub-id-type="doi">10.1186/s13041-020-00654-w</pub-id> </citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Komori</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Kobayashi</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Matsuo</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Kino</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Miyazawa</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Csn3 Gene Is Regulated by All-Trans Retinoic Acid during Neural Differentiation in Mouse P19 Cells</article-title>. <source>PLoS One</source> <volume>8</volume> (<issue>4</issue>), <fpage>e61938</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0061938</pub-id> </citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kondov</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Milenkovikj</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Kondov</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Petrushevska</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Basheska</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Bogdanovska-Todorovska</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Presentation of the Molecular Subtypes of Breast Cancer Detected by Immunohistochemistry in Surgically Treated Patients</article-title>. <source>Open Access Maced. J. Med. Sci.</source> <volume>6</volume> (<issue>6</issue>), <fpage>961</fpage>&#x2013;<lpage>967</lpage>. <pub-id pub-id-type="doi">10.3889/oamjms.2018.231</pub-id> </citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Korsunsky</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Millard</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Fan</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Slowikowski</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Wei</surname>
<given-names>K.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Fast, Sensitive and Accurate Integration of Single-Cell Data with Harmony</article-title>. <source>Nat. Methods</source> <volume>16</volume> (<issue>12</issue>), <fpage>1289</fpage>&#x2013;<lpage>1296</lpage>. <pub-id pub-id-type="doi">10.1038/s41592-019-0619-0</pub-id> </citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Krebsbach</surname>
<given-names>P. H.</given-names>
</name>
<name>
<surname>Villa-Diaz</surname>
<given-names>L. G.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>The Role of Integrin &#x3b1;6 (CD49f) in Stem Cells: More Than a Conserved Biomarker</article-title>. <source>Stem Cells Dev.</source> <volume>26</volume> (<issue>15</issue>), <fpage>1090</fpage>&#x2013;<lpage>1099</lpage>. <pub-id pub-id-type="doi">10.1089/scd.2016.0319</pub-id> </citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kumar</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Prasad</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Bhat-Nakshatri</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Anjanappa</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Kalra</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Marino</surname>
<given-names>N.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Normal Breast-Derived Epithelial Cells with Luminal and Intrinsic Subtype-Enriched Gene Expression Document Interindividual Differences in Their Differentiation Cascade</article-title>. <source>Cancer Res.</source> <volume>78</volume> (<issue>17</issue>), <fpage>5107</fpage>&#x2013;<lpage>5123</lpage>. <pub-id pub-id-type="doi">10.1158/0008-5472.can-18-0509</pub-id> </citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Le Gac</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>van den Berg</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Single Cell Electroporation Using Microfluidic Devices</article-title>. <source>Methods Mol. Biol.</source> <volume>853</volume>, <fpage>65</fpage>&#x2013;<lpage>82</lpage>. <pub-id pub-id-type="doi">10.1007/978-1-61779-567-1_7</pub-id> </citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lehmann</surname>
<given-names>B. D.</given-names>
</name>
<name>
<surname>Jovanovi&#x107;</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Estrada</surname>
<given-names>M. V.</given-names>
</name>
<name>
<surname>Johnson</surname>
<given-names>K. N.</given-names>
</name>
<name>
<surname>Shyr</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>Refinement of Triple-Negative Breast Cancer Molecular Subtypes: Implications for Neoadjuvant Chemotherapy Selection</article-title>. <source>PLoS One</source> <volume>11</volume> (<issue>6</issue>), <fpage>e0157368</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0157368</pub-id> </citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Levine</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2000</year>). <article-title>Epirubicin in Breast Cancer: Present and Future</article-title>. <source>Clin. Breast Cancer</source> <volume>1</volume> (<issue>Suppl. 1</issue>), <fpage>S62</fpage>&#x2013;<lpage>S67</lpage>. <pub-id pub-id-type="doi">10.3816/cbc.2000.s.012</pub-id> </citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lichtner</surname>
<given-names>R. B.</given-names>
</name>
<name>
<surname>Julian</surname>
<given-names>J. A.</given-names>
</name>
<name>
<surname>North</surname>
<given-names>S. M.</given-names>
</name>
<name>
<surname>Glasser</surname>
<given-names>S. R.</given-names>
</name>
<name>
<surname>Nicolson</surname>
<given-names>G. L.</given-names>
</name>
</person-group> (<year>1991</year>). <article-title>Coexpression of Cytokeratins Characteristic for Myoepithelial and Luminal Cell Lineages in Rat 13762NF Mammary Adenocarcinoma Tumors and Their Spontaneous Metastases</article-title>. <source>Cancer Res.</source> <volume>51</volume> (<issue>21</issue>), <fpage>5943</fpage>&#x2013;<lpage>5950</lpage>. </citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Bai</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Ning</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Bispecific Antibody Targeting TROP2xCD3 Suppresses Tumor Growth of Triple Negative Breast Cancer</article-title>. <source>J. Immunother. Cancer</source> <volume>9</volume> (<issue>10</issue>), <fpage>e003468</fpage>. <pub-id pub-id-type="doi">10.1136/jitc-2021-003468</pub-id> </citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Llufrio</surname>
<given-names>E. M.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Naser</surname>
<given-names>F. J.</given-names>
</name>
<name>
<surname>Patti</surname>
<given-names>G. J.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Sorting Cells Alters Their Redox State and Cellular Metabolome</article-title>. <source>Redox Biol.</source> <volume>16</volume>, <fpage>381</fpage>&#x2013;<lpage>387</lpage>. <pub-id pub-id-type="doi">10.1016/j.redox.2018.03.004</pub-id> </citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Maddaly</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Subramaniyan</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Balasubramanian</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Cancer Cytokines and the Relevance of 3D Cultures for Studying Those Implicated in Human Cancers</article-title>. <source>J. Cell. Biochem.</source> <volume>118</volume> (<issue>9</issue>), <fpage>2544</fpage>&#x2013;<lpage>2558</lpage>. <pub-id pub-id-type="doi">10.1002/jcb.25970</pub-id> </citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Malhotra</surname>
<given-names>G. K.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Band</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Band</surname>
<given-names>V.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Histological, Molecular and Functional Subtypes of Breast Cancers</article-title>. <source>Cancer Biol. Ther.</source> <volume>10</volume> (<issue>10</issue>), <fpage>955</fpage>&#x2013;<lpage>960</lpage>. <pub-id pub-id-type="doi">10.4161/cbt.10.10.13879</pub-id> </citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Morcos</surname>
<given-names>M. N. F.</given-names>
</name>
<name>
<surname>Schoedel</surname>
<given-names>K. B.</given-names>
</name>
<name>
<surname>Hoppe</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Behrendt</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Basak</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Clevers</surname>
<given-names>H. C.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>SCA-1 Expression Level Identifies Quiescent Hematopoietic Stem and Progenitor Cells</article-title>. <source>Stem Cell. Rep.</source> <volume>8</volume> (<issue>6</issue>), <fpage>1472</fpage>&#x2013;<lpage>1478</lpage>. <pub-id pub-id-type="doi">10.1016/j.stemcr.2017.04.012</pub-id> </citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mori</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Nakagami</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Koibuchi</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Miura</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Takami</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Koriyama</surname>
<given-names>H.</given-names>
</name>
<etal/>
</person-group> (<year>2009</year>). <article-title>Zyxin Mediates Actin Fiber Reorganization in Epithelial-Mesenchymal Transition and Contributes to Endocardial Morphogenesis</article-title>. <source>MBoC</source> <volume>20</volume> (<issue>13</issue>), <fpage>3115</fpage>&#x2013;<lpage>3124</lpage>. <pub-id pub-id-type="doi">10.1091/mbc.e09-01-0046</pub-id> </citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Moritani</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Ichihara</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Yatabe</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Hasegawa</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Iwakoshi</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Hosoda</surname>
<given-names>W.</given-names>
</name>
<etal/>
</person-group> (<year>2015</year>). <article-title>Immunohistochemical Expression of Myoepithelial Markers in Adenomyoepithelioma of the Breast: A Unique Paradoxical Staining Pattern of High-Molecular Weight Cytokeratins</article-title>. <source>Virchows Arch.</source> <volume>466</volume> (<issue>2</issue>), <fpage>191</fpage>&#x2013;<lpage>198</lpage>. <pub-id pub-id-type="doi">10.1007/s00428-014-1687-2</pub-id> </citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Muhl</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Genov&#xe9;</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Leptidis</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>He</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Mocci</surname>
<given-names>G.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Single-cell Analysis Uncovers Fibroblast Heterogeneity and Criteria for Fibroblast and Mural Cell Identification and Discrimination</article-title>. <source>Nat. Commun.</source> <volume>11</volume> (<issue>1</issue>), <fpage>3953</fpage>. <pub-id pub-id-type="doi">10.1038/s41467-020-17740-1</pub-id> </citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Muzio</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Maggiora</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Paiuzzi</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Oraldi</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Canuto</surname>
<given-names>R. A.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Aldehyde Dehydrogenases and Cell Proliferation</article-title>. <source>Free Radic. Biol. Med.</source> <volume>52</volume> (<issue>4</issue>), <fpage>735</fpage>&#x2013;<lpage>746</lpage>. <pub-id pub-id-type="doi">10.1016/j.freeradbiomed.2011.11.033</pub-id> </citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Newman</surname>
<given-names>A. M.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>C. L.</given-names>
</name>
<name>
<surname>Green</surname>
<given-names>M. R.</given-names>
</name>
<name>
<surname>Gentles</surname>
<given-names>A. J.</given-names>
</name>
<name>
<surname>Feng</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2015</year>). <article-title>Robust Enumeration of Cell Subsets from Tissue Expression Profiles</article-title>. <source>Nat. Methods</source> <volume>12</volume> (<issue>5</issue>), <fpage>453</fpage>&#x2013;<lpage>457</lpage>. <pub-id pub-id-type="doi">10.1038/nmeth.3337</pub-id> </citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Noll</surname>
<given-names>J. E.</given-names>
</name>
<name>
<surname>Vandyke</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Hewett</surname>
<given-names>D. R.</given-names>
</name>
<name>
<surname>Mrozik</surname>
<given-names>K. M.</given-names>
</name>
<name>
<surname>Bala</surname>
<given-names>R. J.</given-names>
</name>
<name>
<surname>Williams</surname>
<given-names>S. A.</given-names>
</name>
<etal/>
</person-group> (<year>2015</year>). <article-title>PTTG1 Expression Is Associated with Hyperproliferative Disease and Poor Prognosis in Multiple Myeloma</article-title>. <source>J. Hematol. Oncol.</source> <volume>8</volume>, <fpage>106</fpage>. <pub-id pub-id-type="doi">10.1186/s13045-015-0209-2</pub-id> </citation>
</ref>
<ref id="B46">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nounou</surname>
<given-names>M. I.</given-names>
</name>
<name>
<surname>ElAmrawy</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Ahmed</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Abdelraouf</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Goda</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Syed-Sha-Qhattal</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Breast Cancer: Conventional Diagnosis and Treatment Modalities and Recent Patents and Technologies</article-title>. <source>Breast Cancer (Auckl)</source> <volume>9</volume> (<issue>Suppl. 2</issue>), <fpage>17</fpage>&#x2013;<lpage>34</lpage>. <pub-id pub-id-type="doi">10.4137/BCBCR.S29420</pub-id> </citation>
</ref>
<ref id="B47">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Olsen</surname>
<given-names>D. R.</given-names>
</name>
<name>
<surname>Peltonen</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Jaakkola</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Chu</surname>
<given-names>M. L.</given-names>
</name>
<name>
<surname>Uitto</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>1989</year>). <article-title>Collagen Gene Expression by Cultured Human Skin Fibroblasts. Abundant Steady-State Levels of Type VI Procollagen Messenger RNAs</article-title>. <source>J. Clin. Investig.</source> <volume>83</volume> (<issue>3</issue>), <fpage>791</fpage>&#x2013;<lpage>795</lpage>. <pub-id pub-id-type="doi">10.1172/jci113959</pub-id> </citation>
</ref>
<ref id="B48">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Osborne</surname>
<given-names>C. K.</given-names>
</name>
<name>
<surname>Hobbs</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Trent</surname>
<given-names>J. M.</given-names>
</name>
</person-group> (<year>1987</year>). <article-title>Biological Differences Among MCF-7 Human Breast Cancer Cell Lines from Different Laboratories</article-title>. <source>Breast Cancer Res. Tr.</source> <volume>9</volume> (<issue>2</issue>), <fpage>111</fpage>&#x2013;<lpage>121</lpage>. <pub-id pub-id-type="doi">10.1007/bf01807363</pub-id> </citation>
</ref>
<ref id="B49">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pal</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Milevskiy</surname>
<given-names>M. J. G.</given-names>
</name>
<name>
<surname>Vaillant</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Prokopuk</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Dawson</surname>
<given-names>C. A.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Single Cell Transcriptome Atlas of Mouse Mammary Epithelial Cells across Development</article-title>. <source>Breast Cancer Res.</source> <volume>23</volume> (<issue>1</issue>), <fpage>69</fpage>. <pub-id pub-id-type="doi">10.1186/s13058-021-01445-4</pub-id> </citation>
</ref>
<ref id="B50">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Paul</surname>
<given-names>C. D.</given-names>
</name>
<name>
<surname>Mistriotis</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Konstantopoulos</surname>
<given-names>K.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Cancer Cell Motility: Lessons from Migration in Confined Spaces</article-title>. <source>Nat. Rev. Cancer</source> <volume>17</volume> (<issue>2</issue>), <fpage>131</fpage>&#x2013;<lpage>140</lpage>. <pub-id pub-id-type="doi">10.1038/nrc.2016.123</pub-id> </citation>
</ref>
<ref id="B51">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Petitti</surname>
<given-names>D. B.</given-names>
</name>
<name>
<surname>Perlman</surname>
<given-names>J. A.</given-names>
</name>
</person-group> (<year>1988</year>). <article-title>Re: "A Prospective Cohort Study of Postmenopausal Hormone Use and Risk of Breast Cancer in US Women"</article-title>. <source>Am. J. Epidemiol.</source> <volume>127</volume> (<issue>4</issue>), <fpage>883</fpage>. <pub-id pub-id-type="doi">10.1093/oxfordjournals.aje.a114876</pub-id> </citation>
</ref>
<ref id="B52">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Prater</surname>
<given-names>M. D.</given-names>
</name>
<name>
<surname>Petit</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Russell</surname>
<given-names>I. A.</given-names>
</name>
<name>
<surname>Giraddi</surname>
<given-names>R. R.</given-names>
</name>
<name>
<surname>Shehata</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Menon</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2014</year>). <article-title>Mammary Stem Cells Have Myoepithelial Cell Properties</article-title>. <source>Nat. Cell. Biol.</source> <volume>16</volume> (<issue>10</issue>), <fpage>942</fpage>&#x2013;<lpage>950</lpage>. <pub-id pub-id-type="doi">10.1038/ncb3025</pub-id> </citation>
</ref>
<ref id="B53">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Reichmann</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Ball</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Groner</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Friis</surname>
<given-names>R. R.</given-names>
</name>
</person-group> (<year>1989</year>). <article-title>New Mammary Epithelial and Fibroblastic Cell Clones in Coculture Form Structures Competent to Differentiate Functionally</article-title>. <source>J. Cell. Biol.</source> <volume>108</volume> (<issue>3</issue>), <fpage>1127</fpage>&#x2013;<lpage>1138</lpage>. <pub-id pub-id-type="doi">10.1083/jcb.108.3.1127</pub-id> </citation>
</ref>
<ref id="B54">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ren</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Kang</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Z.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Understanding Tumor Ecosystems by Single-Cell Sequencing: Promises and Limitations</article-title>. <source>Genome Biol.</source> <volume>19</volume> (<issue>1</issue>), <fpage>211</fpage>. <pub-id pub-id-type="doi">10.1186/s13059-018-1593-z</pub-id> </citation>
</ref>
<ref id="B55">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Reuben</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Gopalakrishnan</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Wagner</surname>
<given-names>H. E.</given-names>
</name>
<name>
<surname>Spencer</surname>
<given-names>C. N.</given-names>
</name>
<name>
<surname>Austin-Breneman</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Jiang</surname>
<given-names>H.</given-names>
</name>
<etal/>
</person-group> (<year>2015</year>). <article-title>Working with Human Tissues for Translational Cancer Research</article-title>. <source>J. Vis. Exp.</source> <volume>105</volume>. <pub-id pub-id-type="doi">10.3791/53189</pub-id> </citation>
</ref>
<ref id="B56">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ricardo</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Phelan</surname>
<given-names>K.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>Trypsinizing and Subculturing Mammalian Cells</article-title>. <source>J. Vis. Exp.</source> (<issue>16</issue>). <pub-id pub-id-type="doi">10.3791/755</pub-id> </citation>
</ref>
<ref id="B57">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ricardo</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Vieira</surname>
<given-names>A. F.</given-names>
</name>
<name>
<surname>Gerhard</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Leitao</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Pinto</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Cameselle-Teijeiro</surname>
<given-names>J. F.</given-names>
</name>
<etal/>
</person-group> (<year>2011</year>). <article-title>Breast Cancer Stem Cell Markers CD44, CD24 and ALDH1: Expression Distribution within Intrinsic Molecular Subtype</article-title>. <source>J. Clin. Pathology</source> <volume>64</volume> (<issue>11</issue>), <fpage>937</fpage>&#x2013;<lpage>946</lpage>. <pub-id pub-id-type="doi">10.1136/jcp.2011.090456</pub-id> </citation>
</ref>
<ref id="B58">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ryman</surname>
<given-names>V. E.</given-names>
</name>
<name>
<surname>Packiriswamy</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Sordillo</surname>
<given-names>L. M.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Role of Endothelial Cells in Bovine Mammary Gland Health and Disease</article-title>. <source>Anim. Health. Res. Rev.</source> <volume>16</volume> (<issue>2</issue>), <fpage>135</fpage>&#x2013;<lpage>149</lpage>. <pub-id pub-id-type="doi">10.1017/s1466252315000158</pub-id> </citation>
</ref>
<ref id="B59">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sachs</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>de Ligt</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Kopper</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Gogola</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Bounova</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Weeber</surname>
<given-names>F.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>A Living Biobank of Breast Cancer Organoids Captures Disease Heterogeneity</article-title>. <source>Cell</source> <volume>172</volume> (<issue>1-2</issue>), <fpage>373</fpage>&#x2013;<lpage>386.e10</lpage>. <pub-id pub-id-type="doi">10.1016/j.cell.2017.11.010</pub-id> </citation>
</ref>
<ref id="B60">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sauvat</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Segura</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Spaggiari</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Muller</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>H.</given-names>
</name>
<etal/>
</person-group> (<year>2015</year>). <article-title>Quantification of Cellular Viability by Automated Microscopy and Flow Cytometry</article-title>. <source>Oncotarget</source> <volume>6</volume> (<issue>11</issue>), <fpage>9467</fpage>&#x2013;<lpage>9475</lpage>. <pub-id pub-id-type="doi">10.18632/oncotarget.3266</pub-id> </citation>
</ref>
<ref id="B61">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Slepicka</surname>
<given-names>P. F.</given-names>
</name>
<name>
<surname>Cyrill</surname>
<given-names>S. L.</given-names>
</name>
<name>
<surname>Dos Santos</surname>
<given-names>C. O.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Pregnancy and Breast Cancer: Pathways to Understand Risk and Prevention</article-title>. <source>Trends Mol. Med.</source> <volume>25</volume> (<issue>10</issue>), <fpage>866</fpage>&#x2013;<lpage>881</lpage>. <pub-id pub-id-type="doi">10.1016/j.molmed.2019.06.003</pub-id> </citation>
</ref>
<ref id="B62">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Svensson</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Natarajan</surname>
<given-names>K. N.</given-names>
</name>
<name>
<surname>Ly</surname>
<given-names>L. H.</given-names>
</name>
<name>
<surname>Miragaia</surname>
<given-names>R. J.</given-names>
</name>
<name>
<surname>Labalette</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Macaulay</surname>
<given-names>I. C.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>Power Analysis of Single-Cell RNA-Sequencing Experiments</article-title>. <source>Nat. Methods</source> <volume>14</volume> (<issue>4</issue>), <fpage>381</fpage>&#x2013;<lpage>387</lpage>. <pub-id pub-id-type="doi">10.1038/nmeth.4220</pub-id> </citation>
</ref>
<ref id="B63">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Takebe</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Wells</surname>
<given-names>J. M.</given-names>
</name>
<name>
<surname>Helmrath</surname>
<given-names>M. A.</given-names>
</name>
<name>
<surname>Zorn</surname>
<given-names>A. M.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Organoid Center Strategies for Accelerating Clinical Translation</article-title>. <source>Cell. Stem Cell.</source> <volume>22</volume> (<issue>6</issue>), <fpage>806</fpage>&#x2013;<lpage>809</lpage>. <pub-id pub-id-type="doi">10.1016/j.stem.2018.05.008</pub-id> </citation>
</ref>
<ref id="B64">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Teschendorff</surname>
<given-names>A. E.</given-names>
</name>
<name>
<surname>Enver</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Single-cell Entropy for Accurate Estimation of Differentiation Potency from a Cell&#x27;s Transcriptome</article-title>. <source>Nat. Commun.</source> <volume>8</volume>, <fpage>15599</fpage>. <pub-id pub-id-type="doi">10.1038/ncomms15599</pub-id> </citation>
</ref>
<ref id="B65">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Trapnell</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Cacchiarelli</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Grimsby</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Pokharel</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Morse</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>2014</year>). <article-title>The Dynamics and Regulators of Cell Fate Decisions Are Revealed by Pseudotemporal Ordering of Single Cells</article-title>. <source>Nat. Biotechnol.</source> <volume>32</volume> (<issue>4</issue>), <fpage>381</fpage>&#x2013;<lpage>386</lpage>. <pub-id pub-id-type="doi">10.1038/nbt.2859</pub-id> </citation>
</ref>
<ref id="B66">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tripathy</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2002</year>). <article-title>Gemcitabine in Breast Cancer: Future Directions</article-title>. <source>Clin. Breast Cancer</source> <volume>3</volume> (<issue>Suppl. 1</issue>), <fpage>45</fpage>&#x2013;<lpage>48</lpage>. <pub-id pub-id-type="doi">10.3816/cbc.2002.s.010</pub-id> </citation>
</ref>
<ref id="B67">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Twigger</surname>
<given-names>A.-J.</given-names>
</name>
<name>
<surname>Hepworth</surname>
<given-names>A. R.</given-names>
</name>
<name>
<surname>Lai</surname>
<given-names>C. T.</given-names>
</name>
<name>
<surname>Chetwynd</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Stuebe</surname>
<given-names>A. M.</given-names>
</name>
<name>
<surname>Blancafort</surname>
<given-names>P.</given-names>
</name>
<etal/>
</person-group> (<year>2015</year>). <article-title>Gene Expression in Breastmilk Cells Is Associated with Maternal and Infant Characteristics</article-title>. <source>Sci. Rep.</source> <volume>5</volume>, <fpage>12933</fpage>. <pub-id pub-id-type="doi">10.1038/srep12933</pub-id> </citation>
</ref>
<ref id="B68">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Vachon</surname>
<given-names>P. H.</given-names>
</name>
<name>
<surname>Beaulieu</surname>
<given-names>J. F.</given-names>
</name>
</person-group> (<year>1992</year>). <article-title>Transient Mosaic Patterns of Morphological and Functional Differentiation in the Caco-2 Cell Line</article-title>. <source>Gastroenterology</source> <volume>103</volume> (<issue>2</issue>), <fpage>414</fpage>&#x2013;<lpage>423</lpage>. <pub-id pub-id-type="doi">10.1016/0016-5085(92)90829-n</pub-id> </citation>
</ref>
<ref id="B69">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Visvader</surname>
<given-names>J. E.</given-names>
</name>
<name>
<surname>Stingl</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Mammary Stem Cells and the Differentiation Hierarchy: Current Status and Perspectives</article-title>. <source>Genes. Dev.</source> <volume>28</volume> (<issue>11</issue>), <fpage>1143</fpage>&#x2013;<lpage>1158</lpage>. <pub-id pub-id-type="doi">10.1101/gad.242511.114</pub-id> </citation>
</ref>
<ref id="B70">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Vranic</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Gatalica</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Z. Y.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Update on the Molecular Profile of the MDA-MB-453 Cell Line as a Model for Apocrine Breast Carcinoma Studies</article-title>. <source>Oncol. Lett.</source> <volume>2</volume> (<issue>6</issue>), <fpage>1131</fpage>&#x2013;<lpage>1137</lpage>. <pub-id pub-id-type="doi">10.3892/ol.2011.375</pub-id> </citation>
</ref>
<ref id="B84">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Hayward</surname>
<given-names>S. W.</given-names>
</name>
<name>
<surname>Cao</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Thayer</surname>
<given-names>K. A.</given-names>
</name>
<name>
<surname>Cunha</surname>
<given-names>G. R.</given-names>
</name>
</person-group> (<year>2001</year>). <article-title>Cell Differentiation Lineage in the Prostate</article-title>. <source>Differentiation</source> <volume>68</volume> (<issue>4-5</issue>), <fpage>270</fpage>&#x2013;<lpage>279</lpage>. </citation>
</ref>
<ref id="B71">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wei</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>The Diagnostic Value of Serum HE4 and CA-125 and ROMA Index in Ovarian Cancer</article-title>. <source>Biomed. Rep.</source> <volume>5</volume> (<issue>1</issue>), <fpage>41</fpage>&#x2013;<lpage>44</lpage>. <pub-id pub-id-type="doi">10.3892/br.2016.682</pub-id> </citation>
</ref>
<ref id="B72">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wu</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Hu</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Guo</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Dai</surname>
<given-names>Z.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>clusterProfiler 4.0: A Universal Enrichment Tool for Interpreting Omics Data</article-title>. <source>Innovation</source> <volume>2</volume> (<issue>3</issue>), <fpage>100141</fpage>. <pub-id pub-id-type="doi">10.1016/j.xinn.2021.100141</pub-id> </citation>
</ref>
<ref id="B73">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xia</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>He</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Aji</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Gao</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Organoid Technology in Cancer Precision Medicine</article-title>. <source>Cancer Lett.</source> <volume>457</volume>, <fpage>20</fpage>&#x2013;<lpage>27</lpage>. <pub-id pub-id-type="doi">10.1016/j.canlet.2019.04.039</pub-id> </citation>
</ref>
<ref id="B74">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xiang</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>X.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>A Comparison for Dimensionality Reduction Methods of Single-Cell RNA-Seq Data</article-title>. <source>Front. Genet.</source> <volume>12</volume>, <fpage>646936</fpage>. <pub-id pub-id-type="doi">10.3389/fgene.2021.646936</pub-id> </citation>
</ref>
<ref id="B75">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xiong</surname>
<given-names>D.-d.</given-names>
</name>
<name>
<surname>Zeng</surname>
<given-names>C.-m.</given-names>
</name>
<name>
<surname>Jiang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Luo</surname>
<given-names>D.-z.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>G.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Ki-67/MKI67 as a Predictive Biomarker for Clinical Outcome in Gastric Cancer Patients: An Updated Meta-Analysis and Systematic Review Involving 53 Studies and 7078 Patients</article-title>. <source>J. Cancer</source> <volume>10</volume> (<issue>22</issue>), <fpage>5339</fpage>&#x2013;<lpage>5354</lpage>. <pub-id pub-id-type="doi">10.7150/jca.30074</pub-id> </citation>
</ref>
<ref id="B76">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xu</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Lyu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Yi</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Song</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>K.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Organoid Technology and Applications in Cancer Research</article-title>. <source>J. Hematol. Oncol.</source> <volume>11</volume> (<issue>1</issue>), <fpage>116</fpage>. <pub-id pub-id-type="doi">10.1186/s13045-018-0662-9</pub-id> </citation>
</ref>
<ref id="B77">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xu</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Xie</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Hu</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Single-cell RNA Sequencing Reveals Cell Heterogeneity and Transcriptome Profile of Breast Cancer Lymph Node Metastasis</article-title>. <source>Oncogenesis</source> <volume>10</volume> (<issue>10</issue>), <fpage>66</fpage>. <pub-id pub-id-type="doi">10.1038/s41389-021-00355-6</pub-id> </citation>
</ref>
<ref id="B78">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Xue</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>X.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Prognostic Value of Different Amounts of Cancer Stem Cells in Different Molecular Subtypes of Breast Cancer</article-title>. <source>Gland Surg.</source> <volume>1</volume> (<issue>1</issue>), <fpage>20</fpage>&#x2013;<lpage>24</lpage>. <pub-id pub-id-type="doi">10.3978/j.issn.2227-684X.2012.04.02</pub-id> </citation>
</ref>
<ref id="B79">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Jiao</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Mammary Gland Stem Cells and Their Application in Breast Cancer</article-title>. <source>Oncotarget</source> <volume>8</volume> (<issue>6</issue>), <fpage>10675</fpage>&#x2013;<lpage>10691</lpage>. <pub-id pub-id-type="doi">10.18632/oncotarget.12893</pub-id> </citation>
</ref>
<ref id="B80">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhao</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Malhotra</surname>
<given-names>G. K.</given-names>
</name>
<name>
<surname>Lele</surname>
<given-names>S. M.</given-names>
</name>
<name>
<surname>Lele</surname>
<given-names>M. S.</given-names>
</name>
<name>
<surname>West</surname>
<given-names>W. W.</given-names>
</name>
<name>
<surname>Eudy</surname>
<given-names>J. D.</given-names>
</name>
<etal/>
</person-group> (<year>2010</year>). <article-title>Telomerase-immortalized Human Mammary Stem/progenitor Cells with Ability to Self-Renew and Differentiate</article-title>. <source>Proc. Natl. Acad. Sci. U.S.A.</source> <volume>107</volume> (<issue>32</issue>), <fpage>14146</fpage>&#x2013;<lpage>14151</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1009030107</pub-id> </citation>
</ref>
<ref id="B81">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zheng</surname>
<given-names>G. X. Y.</given-names>
</name>
<name>
<surname>Terry</surname>
<given-names>J. M.</given-names>
</name>
<name>
<surname>Belgrader</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Ryvkin</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Bent</surname>
<given-names>Z. W.</given-names>
</name>
<name>
<surname>Wilson</surname>
<given-names>R.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>Massively Parallel Digital Transcriptional Profiling of Single Cells</article-title>. <source>Nat. Commun.</source> <volume>8</volume>, <fpage>14049</fpage>. <pub-id pub-id-type="doi">10.1038/ncomms14049</pub-id> </citation>
</ref>
<ref id="B82">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhou</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Zou</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zheng</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Stem Cells and Cellular Origins of Mammary Gland: Updates in Rationale, Controversies, and Cancer Relevance</article-title>. <source>Stem Cells Int.</source> <volume>2019</volume>, <fpage>4247168</fpage>. <pub-id pub-id-type="doi">10.1155/2019/4247168</pub-id> </citation>
</ref>
</ref-list>
</back>
</article>