<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Appl. Math. Stat.</journal-id>
<journal-title>Frontiers in Applied Mathematics and Statistics</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Appl. Math. Stat.</abbrev-journal-title>
<issn pub-type="epub">2297-4687</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fams.2024.1403901</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Applied Mathematics and Statistics</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Analysis of community connectivity in spatial transcriptomics data</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" equal-contrib="yes">
<name><surname>Xie</surname> <given-names>Juan</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="author-notes" rid="fn001"><sup>&#x02020;</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" equal-contrib="yes">
<name><surname>Jung</surname> <given-names>Kyeong Joo</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<xref ref-type="author-notes" rid="fn001"><sup>&#x02020;</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
</contrib>
<contrib contrib-type="author" equal-contrib="yes">
<name><surname>Allen</surname> <given-names>Carter</given-names></name>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
<xref ref-type="author-notes" rid="fn001"><sup>&#x02020;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/2760577/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Chang</surname> <given-names>Yuzhou</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1691639/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Paul</surname> <given-names>Subhadeep</given-names></name>
<xref ref-type="aff" rid="aff6"><sup>6</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/739234/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Li</surname> <given-names>Zihai</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/2038161/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Ma</surname> <given-names>Qin</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/748441/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Chung</surname> <given-names>Dongjun</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x0002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/231646/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>The Interdisciplinary Ph.D. Program in Biostatistics, The Ohio State University</institution>, <addr-line>Columbus, OH</addr-line>, <country>United States</country></aff>
<aff id="aff2"><sup>2</sup><institution>Department of Biomedical Informatics, The Ohio State University</institution>, <addr-line>Columbus, OH</addr-line>, <country>United States</country></aff>
<aff id="aff3"><sup>3</sup><institution>Pelotonia Institute for Immuno-Oncology, The James Comprehensive Cancer Center, The Ohio State University</institution>, <addr-line>Columbus, OH</addr-line>, <country>United States</country></aff>
<aff id="aff4"><sup>4</sup><institution>Department of Computer Science and Engineering, The Ohio State University</institution>, <addr-line>Columbus, OH</addr-line>, <country>United States</country></aff>
<aff id="aff5"><sup>5</sup><institution>Global Statistical Sciences, Eli Lilly and Company</institution>, <addr-line>Indianapolis, IN</addr-line>, <country>United States</country></aff>
<aff id="aff6"><sup>6</sup><institution>Department of Statistics, The Ohio State University</institution>, <addr-line>Columbus, OH</addr-line>, <country>United States</country></aff>
<author-notes>
<fn fn-type="edited-by"><p>Edited by: Qiwei Li, The University of Texas at Dallas, United States</p></fn>
<fn fn-type="edited-by"><p>Reviewed by: Xiangyu Luo, Renmin University of China, China</p>
<p>Ying Ma, Brown University, United States</p></fn>
<corresp id="c001">&#x0002A;Correspondence: Dongjun Chung <email>chung.911&#x00040;osu.edu</email></corresp>
<fn fn-type="equal" id="fn001"><p>&#x02020;These authors have contributed equally to this work</p></fn></author-notes>
<pub-date pub-type="epub">
<day>12</day>
<month>07</month>
<year>2024</year>
</pub-date>
<pub-date pub-type="collection">
<year>2024</year>
</pub-date>
<volume>10</volume>
<elocation-id>1403901</elocation-id>
<history>
<date date-type="received">
<day>20</day>
<month>03</month>
<year>2024</year>
</date>
<date date-type="accepted">
<day>01</day>
<month>07</month>
<year>2024</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x000A9; 2024 Xie, Jung, Allen, Chang, Paul, Li, Ma and Chung.</copyright-statement>
<copyright-year>2024</copyright-year>
<copyright-holder>Xie, Jung, Allen, Chang, Paul, Li, Ma and Chung</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<abstract>
<sec>
<title>Introduction</title>
<p>The advent of high throughput spatial transcriptomics (HST) has allowed for unprecedented characterization of spatially distinct cell communities within a tissue sample. While a wide range of computational tools exist for detecting cell communities in HST data, none allow for the characterization of community connectivity, i.e., the relative similarity of cells within and between found communities&#x02014;an analysis task that can elucidate cellular dynamics in important settings such as the tumor microenvironment.</p></sec>
<sec>
<title>Methods</title>
<p>To address this gap, we introduce the analysis of community connectivity (ACC), which facilitates understanding of the relative similarity of cells within and between communities. We develop a Bayesian multi-layer network model called BANYAN for the integration of spatial and gene expression information to achieve ACC.</p></sec>
<sec>
<title>Results</title>
<p>We demonstrate BANYAN&#x00027;s ability to recover community connectivity structure via a simulation study based on real sagittal mouse brain HST data. Next, we use BANYAN to implement ACC across a wide range of real data scenarios, including 10 &#x000D7; Visium data of melanoma brain metastases and invasive ductal carcinoma, and NanoString CosMx data of human-small-cell lung cancer, each of which reveals distinct cliques of interacting cell sub-populations. An <monospace>R</monospace> package <monospace>banyan</monospace> is available at <ext-link ext-link-type="uri" xlink:href="https://github.com/dongjunchung/banyan">https://github.com/dongjunchung/banyan</ext-link>.</p></sec></abstract>
<kwd-group>
<kwd>spatial transcriptomics</kwd>
<kwd>analysis of community connectivity</kwd>
<kwd>stochastic block model</kwd>
<kwd>Bayesian models</kwd>
<kwd>network analysis</kwd>
</kwd-group>
<contract-num rid="cn001">R21 HG012482</contract-num>
<contract-num rid="cn002">R01 GM122078</contract-num>
<contract-num rid="cn002">R01 GM131399</contract-num>
<contract-num rid="cn003">U01 DA045300</contract-num>
<contract-num rid="cn004">U54 AG075931</contract-num>
<contract-num rid="cn005">NSF1945971</contract-num>
<contract-sponsor id="cn001">National Human Genome Research Institute<named-content content-type="fundref-id">10.13039/100000051</named-content></contract-sponsor>
<contract-sponsor id="cn002">National Institute of General Medical Sciences<named-content content-type="fundref-id">10.13039/100000057</named-content></contract-sponsor>
<contract-sponsor id="cn003">National Institute on Drug Abuse<named-content content-type="fundref-id">10.13039/100000026</named-content></contract-sponsor>
<contract-sponsor id="cn004">National Institute on Aging<named-content content-type="fundref-id">10.13039/100000049</named-content></contract-sponsor>
<contract-sponsor id="cn005">National Science Foundation<named-content content-type="fundref-id">10.13039/100000001</named-content></contract-sponsor>
<counts>
<fig-count count="5"/>
<table-count count="0"/>
<equation-count count="5"/>
<ref-count count="47"/>
<page-count count="13"/>
<word-count count="7884"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Statistics and Probability</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="s1">
<title>1 Introduction</title>
<p>The advent of spatial transcriptomics has allowed for unprecedented characterization of tissue architecture in terms of spatially resolved transcript abundance [<xref ref-type="bibr" rid="B1">1</xref>]. In particular, <italic>high throughput spatial transcriptomics</italic> (HST) technologies, such as the 10 &#x000D7; Visium platform, have become popular due to their deeper transcriptome-wide sequencing depth. The proliferation of HST data has led to the development of several computational tools for discerning cell sub-populations in HST data while considering both gene expression and spatial information. The existing tools span a range of methodological categories, including neural networks [<xref ref-type="bibr" rid="B2">2</xref>&#x02013;<xref ref-type="bibr" rid="B4">4</xref>], graph clustering algorithms [<xref ref-type="bibr" rid="B5">5</xref>, <xref ref-type="bibr" rid="B6">6</xref>], and Bayesian statistical models [<xref ref-type="bibr" rid="B7">7</xref>, <xref ref-type="bibr" rid="B8">8</xref>].</p>
<p>These methods are fundamentally limited in that they do not explicitly model the interactive nature of cell sub-populations in a tissue sample [<xref ref-type="bibr" rid="B9">9</xref>]. In other words, the sub-populations derived from existing methods are considered static, and no information is provided on how they relate to one another. Meanwhile, it is known that communication within and between groups of cells is a fundamental driver of healthy and diseased processes in complex tissue [<xref ref-type="bibr" rid="B10">10</xref>]. Moreover, Canozo et al. [<xref ref-type="bibr" rid="B4">4</xref>] report substantial heterogeneity within traditional mouse olfactory bulb layer annotations, driven in part by spatial variation in intercellular communication patterns. However, detecting higher resolution cell sup-populations with existing tools is challenging as there is a lack of model-based methodology for determining which cell sup-populations may be members of a common broader phenotype (e.g., immune or cancer cell sub-types) based on similar yet distinct gene expression or spatial location patterns. As a consequence, current tools cannot be used to study the <italic>community connectivity structure</italic> of cell sub-populations, i.e., the relative similarity among cells within and between sub-populations.</p>
<p>By studying community connectivity structure, we may obtain valuable insights into the interactive dynamics and spatial heterogeneity of cell sup-populations in challenging settings such as the tumor microenvironment. For example, instead of simply labeling categories of immune cells and cancer cells in a tumor, we may quantify how these important cell sub-populations relate to one another, and how tertiary intermediate sub-populations may be mediating important dynamics within the tumor microenvironment. Furthermore, characterizing community connectivity structure may help inform more biologically informative annotations of ambiguous sub-populations by relating them to more clearly defined sub-populations. Doing so may allow for a more holistic interpretation of all HST cell clusters in the common case when only a few cell clusters correspond clearly to a known cell type.</p>
<p>To address these gaps, we propose BANYAN (<bold>B</bold>ayesian <bold>AN</bold>alysis of communit<bold>Y</bold> connectivity in sp<bold>A</bold>tial single-cell <bold>N</bold>etworks): a Bayesian statistical network model capable of discerning community connectivity structure in HST data. BANYAN draws inspiration from the vast field of biological network analysis [<xref ref-type="bibr" rid="B11">11</xref>], and is built on the supposition that HST data is most accurately represented as similarity networks that reflect similarity between cell spots in terms of spatial location and transcriptional profiles. As opposed to simple comparisons of marker gene expression across cell sub-populations, quantification of similarity metrics can more effectively represent the information contained in thousands of gene markers. To this end, BANYAN introduces a Bayesian multi-layer stochastic block model [<xref ref-type="bibr" rid="B12">12</xref>, <xref ref-type="bibr" rid="B13">13</xref>] that infers a community connectivity structure to characterize the relationships between cell spots both within and between sub-populations, based jointly on transcriptional and spatial similarity between cell spots. We offer convenient implementation and interactive visualization functionality via the <monospace>R</monospace> package <monospace>BANYAN</monospace>.</p></sec>
<sec sec-type="methods" id="s2">
<title>2 Methods</title>
<p>BANYAN is the first HST computational tool to allow for <italic>analysis of community connectivity</italic> (ACC), i.e., the process of inferring the similarity of cell spots within and between sub-populations. A graphical representation is given in <xref ref-type="fig" rid="F1">Figure 1</xref>, and the workflow to achieve ACC can be summarized as follows. First, given cell spot-level gene expression features and spatial coordinate data from HST platforms, we construct two spot-spot nearest neighbor networks. These networks are then integrated into a multi-layer graph data structure. Then, we fit a Bayesian multi-layer stochastic block model (MLSBM), which assumes that spatial location and gene expression patterns of cell spots arise from a common community structure. The estimated parameters from this model allow us to infer the community structure of the tissue sample by quantifying the relative similarity between cell spots within and between sub-populations.</p>
<fig id="F1" position="float">
<label>Figure 1</label>
<caption><p>BANYAN introduces the analysis of community connectivity. Spatial transcriptomics platforms yield gene expression and spatial coordinate matrices, which may be used to construct spot-spot nearest neighbor networks that describe how cell spots are similar in terms of gene expression or spatial information. These network structures are passed to a multi-layer stochastic block model (MLSBM). Analysis of community connectivity is achieved through estimation of MLSBM connectivity parameters <inline-formula><mml:math id="M1"><mml:msub><mml:mrow><mml:mover accent="true"><mml:mrow><mml:mstyle mathvariant='bold'><mml:mi>&#x00398;</mml:mi></mml:mstyle></mml:mrow><mml:mo>^</mml:mo></mml:mover></mml:mrow><mml:mrow><mml:mi>K</mml:mi><mml:mo>&#x000D7;</mml:mo><mml:mi>K</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula>.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fams-10-1403901-g0001.tif"/>
</fig>
<sec>
<title>2.1 Data pre-processing</title>
<p>To represent the interactive nature of cells and cell types, we adopt two cell-cell similarity networks as our primary data objects: one for gene expression and another for spatial location. To form the cell spot-cell spot gene expression similarity network, we first apply standard pre-processing steps including scaling, removal of technical artifacts, and identification of highly variable genes [<xref ref-type="bibr" rid="B14">14</xref>&#x02013;<xref ref-type="bibr" rid="B16">16</xref>]. We then embed each of the <italic>N</italic> total cell spots in a lower-dimensional space using principal components analysis (PCA) applied to the top 2,000 most variable genes. To form the cell spot-cell spot gene expression similarity matrix, we represent each cell spot as a node and connect each cell spot to its <italic>R</italic> closest neighboring cell spots in the gene expression principal component space using a binary edge. We utilize the same approach to construct the spatial cell spot-cell spot similarity network, where principal components are replaced with 2-dimensional spatial coordinates. The resultant data structure is two networks with <italic>N</italic> nodes, each of degree <italic>R</italic>. By default, we adopt the widely used heuristic of choosing <italic>R</italic> as the closest odd integer to <inline-formula><mml:math id="M2"><mml:msqrt><mml:mrow><mml:mi>N</mml:mi></mml:mrow></mml:msqrt></mml:math></inline-formula> [<xref ref-type="bibr" rid="B17">17</xref>], which allows the number of neighboring spots to increase as the size of the tissue sample increases. With the typical HST experiment yielding a total number of cell spots between 2,000 and 3,000, this heuristic leads to consideration of between third- and fourth-order neighborhood structures (<xref ref-type="supplementary-material" rid="SM1">Supplementary Figure S1</xref>). Overall, we view <italic>R</italic> as a tuning parameter that may be adjusted depending on the amount of information sharing desired across a tissue sample.</p>
</sec>
<sec>
<title>2.2 Model</title>
<p>We develop the core statistical model within BANYAN as an extension of the widely used stochastic block model [<xref ref-type="bibr" rid="B18">18</xref>], a flexible generative model for network data that allows for the assessment of community structure based on the frequency of binary edges among and between subsets of nodes. We define <bold>A</bold><sup>1</sup> as the <italic>N</italic> &#x000D7; <italic>N</italic> binary adjacency matrix encoding the gene expression similarity network, and <bold>A</bold><sup>2</sup> as the binary adjacency matrix encoding the spatial similarity network. The matrix elements <inline-formula><mml:math id="M3"><mml:msubsup><mml:mrow><mml:mi>A</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow><mml:mrow><mml:mn>1</mml:mn></mml:mrow></mml:msubsup></mml:math></inline-formula> and <inline-formula><mml:math id="M4"><mml:msubsup><mml:mrow><mml:mi>A</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msubsup></mml:math></inline-formula> indicate the presence or absence of a binary un-directed edge between nodes <italic>i</italic> and <italic>j</italic> for gene expression and spatial information, respectively. We define <inline-formula><mml:math id="M5"><mml:mrow><mml:mstyle mathvariant="script"><mml:mi>A</mml:mi></mml:mstyle></mml:mrow><mml:mo>=</mml:mo><mml:mrow><mml:mo>{</mml:mo><mml:mrow><mml:msup><mml:mrow><mml:mstyle mathvariant='bold'><mml:mtext>A</mml:mtext></mml:mstyle></mml:mrow><mml:mrow><mml:mn>1</mml:mn></mml:mrow></mml:msup><mml:mo>,</mml:mo><mml:msup><mml:mrow><mml:mstyle mathvariant='bold'><mml:mtext>A</mml:mtext></mml:mstyle></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msup></mml:mrow><mml:mo>}</mml:mo></mml:mrow></mml:math></inline-formula> as the multi-layer graph that encodes similarity between cell spots in terms of both gene expression and spatial information. While we focus on the integration of spatial and gene expression information, our proposed framework may be extended to <italic>L</italic> layers to incorporate other sources of information from multiplexed experimental assays.</p>
<p>Given the multi-layer graph data <inline-formula><mml:math id="M6"><mml:mrow><mml:mstyle mathvariant="script"><mml:mi>A</mml:mi></mml:mstyle></mml:mrow></mml:math></inline-formula>, we assume that the absence or presence of edges in each layer between each pair of nodes <italic>i</italic> and <italic>j</italic> follows a Bernoulli distribution with probability of an edge <italic>&#x003B8;</italic><sub><italic>z</italic><sub><italic>i</italic></sub>, <italic>z</italic><sub><italic>j</italic></sub></sub>, where <italic>z</italic><sub><italic>i</italic></sub> &#x02208; {1, ..., <italic>K</italic>} denotes the latent cell spot sub-population assignment for cell spot <italic>i</italic>. We refer to such a model as MLSBM. Formally, we assume for <italic>l</italic> &#x0003D; 1, 2,</p>
<disp-formula id="E1"><label>(1)</label><mml:math id="M7"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:msubsup><mml:mrow><mml:mi>A</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow><mml:mrow><mml:mi>l</mml:mi></mml:mrow></mml:msubsup><mml:mo>|</mml:mo><mml:mstyle mathvariant='bold'><mml:mtext>z</mml:mtext></mml:mstyle><mml:mo>,</mml:mo><mml:mstyle mathvariant='bold'><mml:mi>&#x00398;</mml:mi></mml:mstyle><mml:mover class="stackrel"><mml:mrow><mml:mo>&#x0007E;</mml:mo></mml:mrow><mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mi>n</mml:mi><mml:mi>d</mml:mi></mml:mrow></mml:mrow></mml:mover><mml:mtext class="textrm" mathvariant="normal">Bernoulli</mml:mtext><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:msub><mml:mrow><mml:mi>&#x003B8;</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>z</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>,</mml:mo><mml:msub><mml:mrow><mml:mi>z</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msub></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mtext>&#x000A0;for&#x000A0;</mml:mtext><mml:mi>i</mml:mi><mml:mo>&#x0003C;</mml:mo><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn><mml:mo>,</mml:mo><mml:mo>.</mml:mo><mml:mo>.</mml:mo><mml:mo>.</mml:mo><mml:mo>,</mml:mo><mml:mi>N</mml:mi><mml:mo>,</mml:mo></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>
<p>where <bold>z</bold> &#x0003D; (<italic>z</italic><sub>1</sub>, ..., <italic>z</italic><sub><italic>N</italic></sub>), and <bold>&#x00398;</bold> is a <italic>K</italic> &#x000D7; <italic>K</italic> <italic>connectivity matrix</italic> with diagonal elements <italic>&#x003B8;</italic><sub><italic>rs</italic></sub> for <italic>r</italic> &#x0003D; <italic>s</italic> &#x0003D; 1, ..., <italic>K</italic> controlling the probability of an edge occurring between two cell spots in the same sub-population, and off-diagonal elements <italic>&#x003B8;</italic><sub><italic>rs</italic></sub> for <italic>r</italic> &#x0003C; <italic>s</italic> &#x0003D; 1, ..., <italic>K</italic> controlling the probability of an edge occurring between two nodes in different cell spot sub-populations. Importantly, Model (<xref ref-type="disp-formula" rid="E1">1</xref>) implies that connections among cell spots in the gene expression and spatial layers are governed by a common set of community structure parameters <bold>z</bold> and <bold>&#x00398;</bold>. Note that in the graph <inline-formula><mml:math id="M8"><mml:mrow><mml:mstyle mathvariant="script"><mml:mi>A</mml:mi></mml:mstyle></mml:mrow></mml:math></inline-formula>, the edges corresponding to the cases that <inline-formula><mml:math id="M9"><mml:msubsup><mml:mrow><mml:mi>A</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow><mml:mrow><mml:mn>1</mml:mn></mml:mrow></mml:msubsup><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:math></inline-formula> and <inline-formula><mml:math id="M10"><mml:msubsup><mml:mrow><mml:mi>A</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msubsup><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:math></inline-formula> usually constitute the core of the community, while the edges corresponding to the cases that <inline-formula><mml:math id="M11"><mml:msubsup><mml:mrow><mml:mi>A</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow><mml:mrow><mml:mn>1</mml:mn></mml:mrow></mml:msubsup><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:math></inline-formula> and <inline-formula><mml:math id="M12"><mml:msubsup><mml:mrow><mml:mi>A</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msubsup><mml:mo>=</mml:mo><mml:mn>0</mml:mn></mml:math></inline-formula>, or <inline-formula><mml:math id="M13"><mml:msubsup><mml:mrow><mml:mi>A</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow><mml:mrow><mml:mn>1</mml:mn></mml:mrow></mml:msubsup><mml:mo>=</mml:mo><mml:mn>0</mml:mn></mml:math></inline-formula> and <inline-formula><mml:math id="M14"><mml:msubsup><mml:mrow><mml:mi>A</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msubsup><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:math></inline-formula>, usually constitute the outskirts of the community. Given Model (<xref ref-type="disp-formula" rid="E1">1</xref>) and data <inline-formula><mml:math id="M15"><mml:mrow><mml:mstyle mathvariant="script"><mml:mi>A</mml:mi></mml:mstyle></mml:mrow></mml:math></inline-formula>, our primary inferential objective is to characterize the cell spot-cell spot interaction both <italic>within</italic> and <italic>between</italic> them by estimating the parameters <bold>&#x00398;</bold>, which we accomplish using a Bayesian approach as described below.</p>
</sec>
<sec>
<title>2.3 Bayesian inference</title>
<sec>
<title>2.3.1 Priors</title>
<p>To achieve a fully Bayesian parameter estimation scheme, we assign prior distributions to all model parameters. We adopt available conjugate priors to obtain closed-form full conditional distributions of all model parameters, allowing for straightforward Gibbs sampling. For the latent cell sub-population indicators <italic>z</italic><sub>1</sub>, ..., <italic>z</italic><sub><italic>N</italic></sub>, we assume a conjugate multinomial-Dirichlet prior with <inline-formula><mml:math id="M16"><mml:msub><mml:mrow><mml:mi>z</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mover class="stackrel"><mml:mrow><mml:mo>&#x0007E;</mml:mo></mml:mrow><mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mi>i</mml:mi><mml:mi>d</mml:mi></mml:mrow></mml:mrow></mml:mover><mml:mstyle class="text"><mml:mtext class="textrm" mathvariant="normal">Categorical</mml:mtext></mml:mstyle><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mstyle mathvariant='bold'><mml:mi>&#x003C0;</mml:mi></mml:mstyle></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula> for <italic>i</italic> &#x0003D; 1, ..., <italic>N</italic>, and <bold>&#x003C0;</bold> &#x0007E; Dirichlet(&#x003B1;<sub>1</sub>, ..., &#x003B1;<sub><italic>K</italic></sub>), where <bold>&#x003C0;</bold> &#x0003D; (&#x003C0;<sub>1</sub>, ..., &#x003C0;<sub><italic>K</italic></sub>) controls the relative size of each cell sub-population to allow for a heterogeneous distribution of cell type abundances. We adopt a conjugate Beta-Bernoulli prior for <bold>&#x00398;</bold> by assuming <inline-formula><mml:math id="M17"><mml:msub><mml:mrow><mml:mi>&#x003B8;</mml:mi></mml:mrow><mml:mrow><mml:mi>r</mml:mi><mml:mi>s</mml:mi></mml:mrow></mml:msub><mml:mover class="stackrel"><mml:mrow><mml:mo>&#x0007E;</mml:mo></mml:mrow><mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mi>i</mml:mi><mml:mi>d</mml:mi></mml:mrow></mml:mrow></mml:mover><mml:mstyle class="text"><mml:mtext class="textrm" mathvariant="normal">Beta</mml:mtext></mml:mstyle><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:msub><mml:mrow><mml:mi>&#x003B2;</mml:mi></mml:mrow><mml:mrow><mml:mn>1</mml:mn></mml:mrow></mml:msub><mml:mo>,</mml:mo><mml:msub><mml:mrow><mml:mi>&#x003B2;</mml:mi></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msub></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula> for <italic>r</italic> &#x0003C; <italic>s</italic> &#x0003D; 1, ..., <italic>K</italic>. As a default, we opt for weakly informative priors by setting &#x003B1;<sub>1</sub> &#x0003D; &#x003B1;<sub>2</sub> &#x0003D;... &#x0003D; &#x003B1;<sub><italic>K</italic></sub> &#x0003D; 1 and &#x003B2;<sub>1</sub> &#x0003D; &#x003B2;<sub>2</sub> &#x0003D; 1 [<xref ref-type="bibr" rid="B19">19</xref>].</p></sec>
<sec>
<title>2.3.2 Markov chain Monte Carlo (MCMC) algorithm</title>
<p>The model proposed in Sections 2.2 and 2.3.1 allows for closed-form full conditional distributions of all model parameters. Thus, we adopt the following Gibbs sampling algorithm for parameter estimation. In practice, we recommend initializing the indicators <italic>z</italic><sub><italic>i</italic></sub>, ..., <italic>z</italic><sub><italic>N</italic></sub> using a heuristic graph clustering method such as the Louvain algorithm [<xref ref-type="bibr" rid="B20">20</xref>] applied to <bold>A</bold><sup>1</sup> to facilitate timely model convergence.</p>
<list list-type="order">
<list-item><p>Update <bold>&#x003C0;</bold> from its full conditional (<bold>&#x003C0;</bold>|<bold>A</bold>, <bold>z</bold>, <bold>&#x00398;</bold>) &#x0007E; Dirichlet(<italic>a</italic><sub>1</sub>, ..., <italic>a</italic><sub><italic>K</italic></sub>), where <italic>a</italic><sub><italic>k</italic></sub> &#x0003D; &#x003B1;<sub><italic>k</italic></sub>&#x0002B;<italic>n</italic><sub><italic>k</italic></sub>, and <italic>n</italic><sub><italic>k</italic></sub> is the number of nodes assigned to cell sub-population <italic>k</italic> at the current MCMC iteration, i.e., <inline-formula><mml:math id="M18"><mml:msub><mml:mrow><mml:mi>n</mml:mi></mml:mrow><mml:mrow><mml:mi>k</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:munderover accentunder="false" accent="false"><mml:mrow><mml:mo>&#x02211;</mml:mo></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:mi>N</mml:mi></mml:mrow></mml:munderover><mml:msub><mml:mrow><mml:mi>I</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>z</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mi>k</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula>.</p></list-item>
<list-item><p>For <italic>r</italic> &#x02264; <italic>s</italic> &#x0003D; 1, ..., <italic>K</italic>, update <italic>&#x003B8;</italic><sub><italic>rs</italic></sub> from</p>
<p><disp-formula id="E2"><mml:math id="M19"><mml:mtable columnalign="left"><mml:mtr><mml:mtd><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:msub><mml:mrow><mml:mi>&#x003B8;</mml:mi></mml:mrow><mml:mrow><mml:mi>r</mml:mi><mml:mi>s</mml:mi></mml:mrow></mml:msub><mml:mo>|</mml:mo><mml:mstyle mathvariant='bold'><mml:mtext>A</mml:mtext></mml:mstyle><mml:mo>,</mml:mo><mml:mstyle mathvariant='bold'><mml:mtext>z</mml:mtext></mml:mstyle><mml:mo>,</mml:mo><mml:mstyle mathvariant='bold'><mml:mi>&#x003C0;</mml:mi></mml:mstyle></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>&#x0007E;</mml:mo><mml:mtext class="textrm" mathvariant="normal">Beta</mml:mtext><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:msub><mml:mrow><mml:mi>&#x003B2;</mml:mi></mml:mrow><mml:mrow><mml:mn>1</mml:mn></mml:mrow></mml:msub><mml:mo>&#x0002B;</mml:mo><mml:mi>A</mml:mi><mml:mrow><mml:mo>[</mml:mo><mml:mrow><mml:mi>r</mml:mi><mml:mi>s</mml:mi></mml:mrow><mml:mo>]</mml:mo></mml:mrow><mml:mo>,</mml:mo><mml:msub><mml:mrow><mml:mi>&#x003B2;</mml:mi></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msub><mml:mo>&#x0002B;</mml:mo><mml:msub><mml:mrow><mml:mi>n</mml:mi></mml:mrow><mml:mrow><mml:mi>r</mml:mi><mml:mi>s</mml:mi></mml:mrow></mml:msub><mml:mo>&#x02212;</mml:mo><mml:mi>A</mml:mi><mml:mrow><mml:mo>[</mml:mo><mml:mrow><mml:mi>r</mml:mi><mml:mi>s</mml:mi></mml:mrow><mml:mo>]</mml:mo></mml:mrow></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula></p>
<p>where <italic>A</italic>[<italic>rs</italic>] are the number of observed edges between communities <italic>r</italic> and <italic>s</italic> across both layers, and <italic>n</italic><sub><italic>rs</italic></sub> &#x0003D; 2(<italic>n</italic><sub><italic>r</italic></sub><italic>n</italic><sub><italic>s</italic></sub>&#x02212;<italic>n</italic><sub><italic>r</italic></sub><italic>I</italic>(<italic>r</italic> &#x0003D; <italic>s</italic>)) are the number of possible edges between communities <italic>r</italic> and <italic>s</italic>, <italic>n</italic><sub><italic>r</italic></sub> is the number of nodes assigned to cell sup-population <italic>r</italic>, and <italic>I</italic>(<italic>r</italic> &#x0003D; <italic>s</italic>) is the indicator function equal to 1 if <italic>r</italic> &#x0003D; <italic>s</italic> and 0 otherwise.</p></list-item>
<list-item><p>For <italic>i</italic> &#x0003D; 1, ..., <italic>N</italic>, update <italic>z</italic><sub><italic>i</italic></sub> from (<italic>z</italic><sub><italic>i</italic></sub>|<italic>z</italic><sub>&#x02212;<italic>i</italic></sub>, <bold>A</bold>, <bold>&#x003C0;</bold>, <bold>&#x00398;</bold>) &#x0007E; Categorical(<bold>&#x003C1;</bold><sub><italic>i</italic></sub>), where <bold>&#x003C1;</bold><sub><italic>i</italic></sub> &#x0003D; (&#x003C1;<sub><italic>i</italic>1</sub>, ..., &#x003C1;<sub><italic>iK</italic></sub>) and</p>
<p><disp-formula id="E3"><mml:math id="M20"><mml:mtable columnalign="left"><mml:mtr><mml:mtd><mml:msub><mml:mrow><mml:mi>&#x003C1;</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mi>k</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:msub><mml:mrow><mml:mi>&#x003C0;</mml:mi></mml:mrow><mml:mrow><mml:mi>k</mml:mi></mml:mrow></mml:msub><mml:mrow><mml:mo stretchy="true">(</mml:mo><mml:mrow><mml:mstyle displaystyle="true"><mml:munderover accentunder="false" accent="false"><mml:mrow><mml:mo>&#x0220F;</mml:mo></mml:mrow><mml:mrow><mml:mi>l</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:munderover></mml:mstyle><mml:mstyle displaystyle="true"><mml:munder class="msub"><mml:mrow><mml:mo>&#x0220F;</mml:mo></mml:mrow><mml:mrow><mml:mi>j</mml:mi><mml:mo>&#x02260;</mml:mo><mml:mi>i</mml:mi></mml:mrow></mml:munder></mml:mstyle><mml:msubsup><mml:mrow><mml:mi>&#x003B8;</mml:mi></mml:mrow><mml:mrow><mml:mi>k</mml:mi><mml:mo>,</mml:mo><mml:msub><mml:mrow><mml:mi>z</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mrow><mml:msubsup><mml:mrow><mml:mi>A</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow><mml:mrow><mml:mi>l</mml:mi></mml:mrow></mml:msubsup></mml:mrow></mml:msubsup><mml:msup><mml:mrow><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mn>1</mml:mn><mml:mo>&#x02212;</mml:mo><mml:msub><mml:mrow><mml:mi>&#x003B8;</mml:mi></mml:mrow><mml:mrow><mml:mi>k</mml:mi><mml:mo>,</mml:mo><mml:msub><mml:mrow><mml:mi>z</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msub></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mrow><mml:mrow><mml:mn>1</mml:mn><mml:mo>&#x02212;</mml:mo><mml:msubsup><mml:mrow><mml:mi>A</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow><mml:mrow><mml:mi>l</mml:mi></mml:mrow></mml:msubsup></mml:mrow></mml:msup></mml:mrow><mml:mo stretchy="true">)</mml:mo></mml:mrow></mml:mtd></mml:mtr><mml:mtr><mml:mtd><mml:mo>&#x02003;&#x02003;</mml:mo><mml:mrow><mml:mo stretchy="true">(</mml:mo><mml:mrow><mml:mstyle displaystyle="true"><mml:munderover accentunder="false" accent="false"><mml:mrow><mml:mo>&#x0220F;</mml:mo></mml:mrow><mml:mrow><mml:mi>l</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:munderover></mml:mstyle><mml:mstyle displaystyle="true"><mml:munder class="msub"><mml:mrow><mml:mo>&#x0220F;</mml:mo></mml:mrow><mml:mrow><mml:mi>h</mml:mi><mml:mo>&#x02260;</mml:mo><mml:mi>i</mml:mi></mml:mrow></mml:munder></mml:mstyle><mml:msubsup><mml:mrow><mml:mi>&#x003B8;</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>z</mml:mi></mml:mrow><mml:mrow><mml:mi>h</mml:mi></mml:mrow></mml:msub><mml:mo>,</mml:mo><mml:mi>k</mml:mi></mml:mrow><mml:mrow><mml:msubsup><mml:mrow><mml:mi>A</mml:mi></mml:mrow><mml:mrow><mml:mi>h</mml:mi><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:mi>l</mml:mi></mml:mrow></mml:msubsup></mml:mrow></mml:msubsup><mml:msup><mml:mrow><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mn>1</mml:mn><mml:mo>&#x02212;</mml:mo><mml:msub><mml:mrow><mml:mi>&#x003B8;</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>z</mml:mi></mml:mrow><mml:mrow><mml:mi>h</mml:mi></mml:mrow></mml:msub><mml:mo>,</mml:mo><mml:mi>k</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mrow><mml:mrow><mml:mn>1</mml:mn><mml:mo>&#x02212;</mml:mo><mml:msubsup><mml:mrow><mml:mi>A</mml:mi></mml:mrow><mml:mrow><mml:mi>h</mml:mi><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:mi>l</mml:mi></mml:mrow></mml:msubsup></mml:mrow></mml:msup></mml:mrow><mml:mo stretchy="true">)</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula></p></list-item>
</list>
</sec>
<sec>
<title>2.3.3 Label switching</title>
<p>Label switching is a ubiquitous issue faced by models whose likelihood is invariant to permutations of a latent categorical variable such as <bold>z</bold>. Consequently, stochastically equivalent permutations of <bold>z</bold> may occur over the course of MCMC sampling, causing the estimates of all community-specific parameters to be conflated, thereby jeopardizing the accuracy of model parameter estimates. Previous approaches for addressing label switching rely on re-shuffling posterior samples after completion of the MCMC algorithm [<xref ref-type="bibr" rid="B21">21</xref>]. However, such methods rely on prediction and are subject to prediction error. To protect against label switching within the MCMC sampler, we adopt the canonical projection of <bold>z</bold> proposed by Peng and Carvalho [<xref ref-type="bibr" rid="B22">22</xref>], who restrict updates of <bold>z</bold> to the reduced sample space <inline-formula><mml:math id="M21"><mml:mrow><mml:mstyle mathvariant="script"><mml:mi>Z</mml:mi></mml:mstyle></mml:mrow><mml:mo>=</mml:mo><mml:mrow><mml:mo>{</mml:mo><mml:mrow><mml:mstyle mathvariant='bold'><mml:mtext>z</mml:mtext></mml:mstyle><mml:mo>:</mml:mo><mml:mstyle class="text"><mml:mtext class="textrm" mathvariant="normal">ord</mml:mtext></mml:mstyle><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mstyle mathvariant='bold'><mml:mtext>z</mml:mtext></mml:mstyle></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>=</mml:mo><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mn>1</mml:mn><mml:mo>,</mml:mo><mml:mo>.</mml:mo><mml:mo>.</mml:mo><mml:mo>.</mml:mo><mml:mo>,</mml:mo><mml:mi>K</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mrow><mml:mo>}</mml:mo></mml:mrow></mml:math></inline-formula>, wherein label switching is less likely due to the restricted sample space. In practice, we manually permute <bold>z</bold> at each MCMC iteration such that community 1 appears first in <bold>z</bold>, community 2 appears second in <bold>z</bold>, <italic>et cetera</italic>. Finally, we estimate <bold>z</bold> using the maximum <italic>a posteriori</italic> (MAP) estimate across all post-burn MCMC samples [<xref ref-type="bibr" rid="B19">19</xref>].</p>
</sec>
</sec>
<sec>
<title>2.4 Analysis of community connectivity</title>
<p>Estimation of the MLSBM model parameters <bold>&#x00398;</bold> with the corresponding maximum <italic>a posteriori</italic> estimates <inline-formula><mml:math id="M22"><mml:mover accent="true"><mml:mrow><mml:mstyle mathvariant='bold'><mml:mi>&#x00398;</mml:mi></mml:mstyle></mml:mrow><mml:mo>^</mml:mo></mml:mover></mml:math></inline-formula> allows for inference of community connectivity structure in HST data. While the estimated community labeling vector <inline-formula><mml:math id="M23"><mml:mover accent="true"><mml:mrow><mml:mstyle mathvariant='bold'><mml:mtext>z</mml:mtext></mml:mstyle></mml:mrow><mml:mo>^</mml:mo></mml:mover></mml:math></inline-formula> is what we use to define communities, the elements of <inline-formula><mml:math id="M24"><mml:mover accent="true"><mml:mrow><mml:mstyle mathvariant='bold'><mml:mi>&#x00398;</mml:mi></mml:mstyle></mml:mrow><mml:mo>^</mml:mo></mml:mover></mml:math></inline-formula> describe how cell spots within and between communities relate to one another, thereby characterizing community connectivity. Specifically, elements <inline-formula><mml:math id="M25"><mml:msub><mml:mrow><mml:mover accent="true"><mml:mrow><mml:mi>&#x003B8;</mml:mi></mml:mrow><mml:mo>^</mml:mo></mml:mover></mml:mrow><mml:mrow><mml:mi>r</mml:mi><mml:mi>s</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula> reflect the estimated probability of a randomly chosen cell spot in community <italic>r</italic> sharing a nearest neighbors edge in <inline-formula><mml:math id="M26"><mml:mrow><mml:mstyle mathvariant="script"><mml:mi>A</mml:mi></mml:mstyle></mml:mrow></mml:math></inline-formula> with a cell spot in community <italic>s</italic>. When <italic>r</italic> &#x0003D; <italic>s</italic>, <inline-formula><mml:math id="M27"><mml:msub><mml:mrow><mml:mover accent="true"><mml:mrow><mml:mi>&#x003B8;</mml:mi></mml:mrow><mml:mo>^</mml:mo></mml:mover></mml:mrow><mml:mrow><mml:mi>r</mml:mi><mml:mi>s</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula> reflects the average connectivity within a community, which may be used to assess the relative homogeneity of a community. Heterogeneous communities tend to have lower average within-community connectivity, while more homogeneous communities tend to have higher within-community connectivity. Likewise, when <italic>r</italic> &#x02260; <italic>s</italic>, <inline-formula><mml:math id="M28"><mml:msub><mml:mrow><mml:mover accent="true"><mml:mrow><mml:mi>&#x003B8;</mml:mi></mml:mrow><mml:mo>^</mml:mo></mml:mover></mml:mrow><mml:mrow><mml:mi>r</mml:mi><mml:mi>s</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula> represents the probability of connection between cell spots in two distinct communities. This between-community connectivity measurement allows us to discern closely related communities that may contain similar cell types from more distinct communities. Taken together, these between and within-community connectivity parameters capacitate analysis of community connectivity.</p>
</sec>
<sec>
<title>2.5 Software implementation</title>
<p>We provide the <monospace>R</monospace> package <monospace>banyan</monospace> for convenient implementation of the proposed workflow. The <monospace>banyan</monospace> package efficiently implements Bayesian estimation using custom Gibbs sampling algorithms implemented in <monospace>C&#x0002B;&#x0002B;</monospace> using <monospace>Rcpp</monospace>. The core model fitting functions integrate seamlessly with standard Seurat [<xref ref-type="bibr" rid="B23">23</xref>] data structures, allowing users to easily incorporate ACC into existing HST analysis workflows. Further, <monospace>banyan</monospace> allows users to investigate community connectivity using external sub-population labels, thereby encouraging widespread utility of ACC. As clustering algorithms for HST proliferate&#x02014;each with different assumptions and optimal use cases, utilizing BANYAN for <italic>post-hoc</italic> community connectivity analysis will help elucidate tissue heterogeneity across the widest possible range of application settings. We developed both interactive and static visualization functions for interrogation of BANYAN sub-population labels and community connectivity structure. The <monospace>banyan</monospace> package interfaces seamlessly with standard <monospace>Seurat</monospace> workflows, and is freely available at <ext-link ext-link-type="uri" xlink:href="https://github.com/dongjunchung/banyan">https://github.com/dongjunchung/banyan</ext-link>.</p></sec></sec>
<sec id="s3">
<title>3 Result</title>
<sec>
<title>3.1 Simulation studies show BANYAN effectively identifies underlying community connectivity structures under a broad range of signal-to-noise ratio settings</title>
<p>We designed a simulation study to validate the performance of the MLSBM employed by BANYAN. We adopted a publicly available sagittal mouse brain data set [<xref ref-type="bibr" rid="B24">24</xref>] sequenced with the 10&#x000D7; Visium platform. In our simulation data, we manually allocated the <italic>N</italic> = 2,696 total cell spots in the original sagital mouse brain data set into five spatially contiguous mouse brain layers. Assuming that a community structure is given as</p>
<disp-formula id="E4"><mml:math id="M29"><mml:mtable columnalign="left"><mml:mtr><mml:mtd><mml:mstyle mathvariant='bold'><mml:mi>&#x00398;</mml:mi></mml:mstyle><mml:mo>=</mml:mo><mml:mrow><mml:mo>[</mml:mo><mml:mrow><mml:mtable style="text-align:axis;" equalrows="false" columnlines="none none none none none none none none none" equalcolumns="false" class="array"><mml:mtr><mml:mtd><mml:mi>&#x003B8;</mml:mi></mml:mtd><mml:mtd><mml:mn>0</mml:mn><mml:mo>.</mml:mo><mml:mn>1</mml:mn></mml:mtd><mml:mtd><mml:mn>0</mml:mn><mml:mo>.</mml:mo><mml:mn>1</mml:mn></mml:mtd><mml:mtd><mml:mn>0</mml:mn><mml:mo>.</mml:mo><mml:mn>1</mml:mn></mml:mtd><mml:mtd><mml:mn>0</mml:mn><mml:mo>.</mml:mo><mml:mn>1</mml:mn></mml:mtd></mml:mtr><mml:mtr><mml:mtd><mml:mn>0</mml:mn><mml:mo>.</mml:mo><mml:mn>1</mml:mn></mml:mtd><mml:mtd><mml:mi>&#x003B8;</mml:mi></mml:mtd><mml:mtd><mml:mn>0</mml:mn><mml:mo>.</mml:mo><mml:mn>1</mml:mn></mml:mtd><mml:mtd><mml:mn>0</mml:mn><mml:mo>.</mml:mo><mml:mn>1</mml:mn></mml:mtd><mml:mtd><mml:mn>0</mml:mn><mml:mo>.</mml:mo><mml:mn>1</mml:mn></mml:mtd></mml:mtr><mml:mtr><mml:mtd><mml:mn>0</mml:mn><mml:mo>.</mml:mo><mml:mn>1</mml:mn></mml:mtd><mml:mtd><mml:mn>0</mml:mn><mml:mo>.</mml:mo><mml:mn>1</mml:mn></mml:mtd><mml:mtd><mml:mi>&#x003B8;</mml:mi></mml:mtd><mml:mtd><mml:mn>0</mml:mn><mml:mo>.</mml:mo><mml:mn>1</mml:mn></mml:mtd><mml:mtd><mml:mn>0</mml:mn><mml:mo>.</mml:mo><mml:mn>1</mml:mn></mml:mtd></mml:mtr><mml:mtr><mml:mtd><mml:mn>0</mml:mn><mml:mo>.</mml:mo><mml:mn>1</mml:mn></mml:mtd><mml:mtd><mml:mn>0</mml:mn><mml:mo>.</mml:mo><mml:mn>1</mml:mn></mml:mtd><mml:mtd><mml:mn>0</mml:mn><mml:mo>.</mml:mo><mml:mn>1</mml:mn></mml:mtd><mml:mtd><mml:mi>&#x003B8;</mml:mi></mml:mtd><mml:mtd><mml:mn>0</mml:mn><mml:mo>.</mml:mo><mml:mn>1</mml:mn></mml:mtd></mml:mtr><mml:mtr><mml:mtd><mml:mn>0</mml:mn><mml:mo>.</mml:mo><mml:mn>1</mml:mn></mml:mtd><mml:mtd><mml:mn>0</mml:mn><mml:mo>.</mml:mo><mml:mn>1</mml:mn></mml:mtd><mml:mtd><mml:mn>0</mml:mn><mml:mo>.</mml:mo><mml:mn>1</mml:mn></mml:mtd><mml:mtd><mml:mn>0</mml:mn><mml:mo>.</mml:mo><mml:mn>1</mml:mn></mml:mtd><mml:mtd><mml:mi>&#x003B8;</mml:mi></mml:mtd></mml:mtr></mml:mtable></mml:mrow><mml:mo>]</mml:mo></mml:mrow><mml:mo>,</mml:mo></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>
<p>we defined the <italic>signal-to-noise ratio</italic> (SNR) of the simulated gene expression network as SNR &#x0003D; <italic>&#x003B8;</italic>/0.1, i.e., the ratio of the within- to between-community connectivity. SNR values much greater than 1 give rise to a strong community structure in the simulated data, while SNR values close to 1 result in a weaker community structure. We do not consider values of SNR below 1, as the resultant disassortative community structure is not reflective of cell type structure in HST data. In addition, we note that SNR was close to 10 in all the real data applications we consider in the following sections, i.e., the ranges of SNR we considered in these simulation studies are significantly lower than those we observe in real datasets. Hence, given the usual SNR levels we observe in real datasets, BANYAN is expected to effectively recover the underlying community connectivity structure.</p>
<p>We explore the effects of varying between-community connectivity and within-community connectivity to modulate the signals-to-noise ratio (SNR). We used the general community structure given by</p>
<disp-formula id="E5"><label>(2)</label><mml:math id="M30"><mml:mtable class="eqnarray" columnalign="left"><mml:mtr><mml:mtd><mml:mstyle mathvariant='bold'><mml:mi>&#x00398;</mml:mi></mml:mstyle><mml:mo>=</mml:mo><mml:mrow><mml:mo>[</mml:mo><mml:mrow><mml:mtable style="text-align:axis;" equalrows="false" columnlines="none none none none none none none none none" equalcolumns="false" class="array"><mml:mtr><mml:mtd><mml:msub><mml:mrow><mml:mi>&#x003B8;</mml:mi></mml:mrow><mml:mrow><mml:mn>11</mml:mn></mml:mrow></mml:msub></mml:mtd><mml:mtd><mml:msub><mml:mrow><mml:mi>&#x003B8;</mml:mi></mml:mrow><mml:mrow><mml:mn>12</mml:mn></mml:mrow></mml:msub></mml:mtd><mml:mtd><mml:msub><mml:mrow><mml:mi>&#x003B8;</mml:mi></mml:mrow><mml:mrow><mml:mn>13</mml:mn></mml:mrow></mml:msub></mml:mtd><mml:mtd><mml:msub><mml:mrow><mml:mi>&#x003B8;</mml:mi></mml:mrow><mml:mrow><mml:mn>14</mml:mn></mml:mrow></mml:msub></mml:mtd><mml:mtd><mml:msub><mml:mrow><mml:mi>&#x003B8;</mml:mi></mml:mrow><mml:mrow><mml:mn>15</mml:mn></mml:mrow></mml:msub></mml:mtd></mml:mtr><mml:mtr><mml:mtd><mml:msub><mml:mrow><mml:mi>&#x003B8;</mml:mi></mml:mrow><mml:mrow><mml:mn>21</mml:mn></mml:mrow></mml:msub></mml:mtd><mml:mtd><mml:msub><mml:mrow><mml:mi>&#x003B8;</mml:mi></mml:mrow><mml:mrow><mml:mn>22</mml:mn></mml:mrow></mml:msub></mml:mtd><mml:mtd><mml:msub><mml:mrow><mml:mi>&#x003B8;</mml:mi></mml:mrow><mml:mrow><mml:mn>23</mml:mn></mml:mrow></mml:msub></mml:mtd><mml:mtd><mml:msub><mml:mrow><mml:mi>&#x003B8;</mml:mi></mml:mrow><mml:mrow><mml:mn>24</mml:mn></mml:mrow></mml:msub></mml:mtd><mml:mtd><mml:msub><mml:mrow><mml:mi>&#x003B8;</mml:mi></mml:mrow><mml:mrow><mml:mn>25</mml:mn></mml:mrow></mml:msub></mml:mtd></mml:mtr><mml:mtr><mml:mtd><mml:msub><mml:mrow><mml:mi>&#x003B8;</mml:mi></mml:mrow><mml:mrow><mml:mn>31</mml:mn></mml:mrow></mml:msub></mml:mtd><mml:mtd><mml:msub><mml:mrow><mml:mi>&#x003B8;</mml:mi></mml:mrow><mml:mrow><mml:mn>32</mml:mn></mml:mrow></mml:msub></mml:mtd><mml:mtd><mml:msub><mml:mrow><mml:mi>&#x003B8;</mml:mi></mml:mrow><mml:mrow><mml:mn>33</mml:mn></mml:mrow></mml:msub></mml:mtd><mml:mtd><mml:msub><mml:mrow><mml:mi>&#x003B8;</mml:mi></mml:mrow><mml:mrow><mml:mn>34</mml:mn></mml:mrow></mml:msub></mml:mtd><mml:mtd><mml:msub><mml:mrow><mml:mi>&#x003B8;</mml:mi></mml:mrow><mml:mrow><mml:mn>35</mml:mn></mml:mrow></mml:msub></mml:mtd></mml:mtr><mml:mtr><mml:mtd><mml:msub><mml:mrow><mml:mi>&#x003B8;</mml:mi></mml:mrow><mml:mrow><mml:mn>41</mml:mn></mml:mrow></mml:msub></mml:mtd><mml:mtd><mml:msub><mml:mrow><mml:mi>&#x003B8;</mml:mi></mml:mrow><mml:mrow><mml:mn>42</mml:mn></mml:mrow></mml:msub></mml:mtd><mml:mtd><mml:msub><mml:mrow><mml:mi>&#x003B8;</mml:mi></mml:mrow><mml:mrow><mml:mn>43</mml:mn></mml:mrow></mml:msub></mml:mtd><mml:mtd><mml:msub><mml:mrow><mml:mi>&#x003B8;</mml:mi></mml:mrow><mml:mrow><mml:mn>44</mml:mn></mml:mrow></mml:msub></mml:mtd><mml:mtd><mml:msub><mml:mrow><mml:mi>&#x003B8;</mml:mi></mml:mrow><mml:mrow><mml:mn>45</mml:mn></mml:mrow></mml:msub></mml:mtd></mml:mtr><mml:mtr><mml:mtd><mml:msub><mml:mrow><mml:mi>&#x003B8;</mml:mi></mml:mrow><mml:mrow><mml:mn>51</mml:mn></mml:mrow></mml:msub></mml:mtd><mml:mtd><mml:msub><mml:mrow><mml:mi>&#x003B8;</mml:mi></mml:mrow><mml:mrow><mml:mn>52</mml:mn></mml:mrow></mml:msub></mml:mtd><mml:mtd><mml:msub><mml:mrow><mml:mi>&#x003B8;</mml:mi></mml:mrow><mml:mrow><mml:mn>53</mml:mn></mml:mrow></mml:msub></mml:mtd><mml:mtd><mml:msub><mml:mrow><mml:mi>&#x003B8;</mml:mi></mml:mrow><mml:mrow><mml:mn>54</mml:mn></mml:mrow></mml:msub></mml:mtd><mml:mtd><mml:msub><mml:mrow><mml:mi>&#x003B8;</mml:mi></mml:mrow><mml:mrow><mml:mn>55</mml:mn></mml:mrow></mml:msub></mml:mtd></mml:mtr></mml:mtable></mml:mrow><mml:mo>]</mml:mo></mml:mrow><mml:mo>,</mml:mo></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>
<p>where by default <italic>&#x003B8;</italic><sub><italic>ij</italic></sub> &#x0003D; 0.1 for <italic>i</italic> &#x02260; <italic>j</italic> and <italic>&#x003B8;</italic><sub><italic>ij</italic></sub> &#x0003D; 0.3 otherwise. In <xref ref-type="fig" rid="F2">Figure 2</xref> we visualize results from three different variations of <xref ref-type="disp-formula" rid="E5">Equation (2)</xref> described above. In the first setting, we varied the between-community connectivity between pair of spatially disjoint communities 1 and 3 and the pair of bordering communities 4 and 5 to analyze the interplay between between-community connectivity and spatial co-localization (<xref ref-type="fig" rid="F2">Figure 2A</xref>). When we selectively decrease SNR by setting <italic>&#x003B8;</italic><sub>13</sub> &#x0003D; <italic>&#x003B8;</italic><sub>45</sub> &#x0003D; 0.175, BANYAN is still able to perfectly recover sub-population labels. However, when we further decrease SNR by increasing <italic>&#x003B8;</italic><sub>13</sub> &#x0003D; <italic>&#x003B8;</italic><sub>45</sub> &#x0003D; 0.225, we find that sub-population inference is corrupted. Notably, as the SNR approaches 1, BANYAN merges sub-populations 4 and 5 first, as they feature high between-community connectivity <italic>and</italic> spatial proximity. Alternatively, BANYAN splits sub-population 1 into two distinct communities instead of combining sub-populations 1 and 3, which are spatially disjoint. In <xref ref-type="supplementary-material" rid="SM1">Supplementary Figure S2</xref>, we visualize this trend across a finer grid of <italic>&#x003B8;</italic><sub>13</sub> and <italic>&#x003B8;</italic><sub>45</sub>. In <xref ref-type="fig" rid="F2">Figure 2B</xref>, we demonstrate this phenomenon from different perspective, in which decreasing the clustering resolution from <italic>K</italic> &#x0003D; 5 to <italic>K</italic> &#x0003D; 4 features merging of the two distinct sub-population 1 components due to their spatial proximity and high connectivity. Finally, in setting 3 (<xref ref-type="fig" rid="F2">Figure 2C</xref>), we investigated the effect of selectively decreasing within-community connectivity parameters for sub-populations 1, 2, and 3. We find that at low SNR settings of <italic>&#x003B8;</italic><sub>11</sub> &#x0003D; <italic>&#x003B8;</italic><sub>22</sub> &#x0003D; <italic>&#x003B8;</italic><sub>33</sub> &#x0003D; 0.2, BANYAN is unable to properly allocate cell spot labels, while increasing the SNR by increasing <italic>&#x003B8;</italic><sub>11</sub> &#x0003D; <italic>&#x003B8;</italic><sub>22</sub> &#x0003D; <italic>&#x003B8;</italic><sub>33</sub> &#x0003D; 0.25 results in correct recovery of ground truth labels. In <xref ref-type="supplementary-material" rid="SM1">Supplementary Figure S3</xref>, we provide results from across a finer grid of <italic>&#x003B8;</italic><sub>11</sub>, <italic>&#x003B8;</italic><sub>22</sub>, and <italic>&#x003B8;</italic><sub>33</sub>. The results from settings 1&#x02013;3 in <xref ref-type="fig" rid="F2">Figure 2</xref> highlight a characteristic of the spatially-aware MLSBM, namely that the model places a preference on merging spatially neighboring communities instead of spatially separate communities when the SNRs for each pair are equally low (i.e., approaches SNR = 1).</p>
<fig id="F2" position="float">
<label>Figure 2</label>
<caption><p>Simulation studies using sagittal mouse brain tissue sample with five cell spot clusters. <bold>(A)</bold> Simulation setting 1, where within-community connectivity (WCC) is 0.3, two between-community connectivity (BCC) (<italic>&#x003B8;</italic><sub>12</sub> and <italic>&#x003B8;</italic><sub>45</sub>) vary from 0.175 to 0.225, and the rest BCC are set to 0.1. <bold>(B)</bold> Simulation setting 2, where WCC is 0.3, two BCC (<italic>&#x003B8;</italic><sub>13</sub> and <italic>&#x003B8;</italic><sub>45</sub>) were set to 0.2, the rest BCC were set to 0.1. The number of communities varies from 5 to 4. <bold>(C)</bold> Simulation setting 3, where all the BCC were set to 0.1, two WCC were set to 0.3, and we vary three WCC from 0.2 to 0.25.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fams-10-1403901-g0002.tif"/>
</fig>
</sec>
<sec>
<title>3.2 Identifying cellular interplay in human melanoma brain metastases</title>
<p>Brain metastases are a common cancer complication, arising most often from lung cancer, breast cancer, and melanoma and occurring in nearly 30% of patients with solid tumors [<xref ref-type="bibr" rid="B25">25</xref>]. In the United States, an estimated 98,000 to 170,000 patients are diagnosed with brain metastases each year, and the incidence is increasing [<xref ref-type="bibr" rid="B26">26</xref>]. Due to the fact that conventional therapies can rarely cure brain metastases, researchers have been seeking alternative treatment options, and immunotherapy is one promising candidate [<xref ref-type="bibr" rid="B27">27</xref>]. In recent years, many scientific efforts have been devoted to investigating the interaction between the immune system and the tumor microenvironment (TME) of brain metastases, shedding light on the immune biology of brain metastases. For instance, Sudmeier et al. [<xref ref-type="bibr" rid="B28">28</xref>] reported that human brain metastases are well infiltrated by CD8<sup>&#x0002B;</sup> T cells.</p>
<p>To better understand the spatial distribution of immune cells in brain metastases TME and their interactive relationship with tumor cells, we applied BANYAN to the human melanoma brain metastasis sample from Sudmeier et al. [<xref ref-type="bibr" rid="B28">28</xref>], who applied spatial transcriptomics and identified distinct tumor, inflammatory, and blood cell sub-populations. Using BANYAN, we identified four spatially distinct spot sub-populations (<xref ref-type="fig" rid="F3">Figure 3A</xref>), characterized the function of each sub-population in the TME using known marker genes (<xref ref-type="fig" rid="F3">Figure 3B</xref>; <xref ref-type="supplementary-material" rid="SM1">Supplementary Figure S4</xref>), and studied the similarity structure among cell spots within and between sub-populations (<xref ref-type="fig" rid="F3">Figures 3C</xref>, <xref ref-type="fig" rid="F3">D</xref>). The identified sub-populations from BANYAN closely resemble the TME regions reported by Sudmeier et al. [<xref ref-type="bibr" rid="B28">28</xref>]. BANYAN sub-population 1 corresponds to blood cells, sub-population 2 to inflammatory immune cells, sub-population 3 to tumor-inflammatory adjacent cells, and sub-population 4 to the tumor region, respectively. Functional annotation based on the expression of marker genes (<xref ref-type="fig" rid="F3">Figure 3B</xref>; <xref ref-type="supplementary-material" rid="SM1">Supplementary Figure S4</xref>) further suggests sub-population 1 consists of naive cells, while both sub-populations 2 and 3 are CD8<sup>&#x0002B;</sup> T cells, and the expression of CD8<sup>&#x0002B;</sup> T cell markers are higher in sub-population 3 compared to those in sub-population 2.</p>
<fig id="F3" position="float">
<label>Figure 3</label>
<caption><p>Community structure in melanoma brain metastasis data. <bold>(A)</bold> Inferred cell spot sub-population labels from BANYAN. Line width indicates the between-community connectivity level, where the thicker the line, the higher the connectivity. Node size reflects within-community connectivity level, where the larger the node, the higher the connectivity. <bold>(B)</bold> Spatial plot and heatmap for tumor and T cell markers. <bold>(C)</bold> Within-community connectivity. <bold>(D)</bold> Between-community connectivity intervals. <bold>(E)</bold> Relationships between T cell receptor similarity and between-community connectivity. <bold>(F)</bold> The repertoire diversity for each sub-population.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fams-10-1403901-g0003.tif"/>
</fig>
<p>We then utilized BANYAN to implement ACC and characterize the interplay among the four identified sub-populations&#x02014;a unique functionality not offered by other HST analysis tools. When investigating within-community connectivity parameters in <xref ref-type="fig" rid="F3">Figure 3C</xref> (<xref ref-type="supplementary-material" rid="SM1">Supplementary Figure S5</xref>), we observe a decreasing density of cell-cell connectivity as we move from outside to within the tumor. This pattern suggests additional cellular heterogeneity within the tumor relative to the surrounding inflammatory and blood tissue components. When consulting the between-community connectivity parameters in <xref ref-type="fig" rid="F3">Figure 3D</xref>, we find two distinct pairs of cell sub-populations: (2,3) and (1,2), which feature significantly higher inter-connectivity than all other pairs of sub-populations. These three sub-populations comprise the tumor-external components of the tissue sample and reflect a relatively high degree of inter-connectivity between blood, immune, and tumor-adjacent sub-populations. In comparison, the tumor region (sub-population 4) featured significantly lower inter-connectivity with the rest of the tissue sample, as evidenced by the significantly lower between-connectivity parameter estimates for the pairs of (3,4), (1,4), and (2,4) in <xref ref-type="fig" rid="F3">Figure 3D</xref>.</p>
<p>To better understand connectivity, we further analyzed the paired single-cell T cell receptor (TCR) sequencing data in terms of repertoire overlap and diversity (<xref ref-type="supplementary-material" rid="SM1">Supplementary Section S1</xref>). It turned out that the pairs with higher BCC values correspond to those with higher TCR similarity (<xref ref-type="fig" rid="F3">Figure 3E</xref>). Furthermore, sub-populations with higher WCC values (e.g., sub-populations 1 and 2) exhibited lower repertoire diversity compared to the ones with lower WCC values (<xref ref-type="fig" rid="F3">Figure 3F</xref>). The above relationships between WCC/BCC and TCR repertoire indicate that ACC holds the potential to uncover cellular dynamics under the setting of TME.</p>
</sec>
<sec>
<title>3.3 Discovering community structure in invasive ductal carcinoma</title>
<p>Accounting for roughly 25% of all non-dermal cancers in women, breast cancer ranks as the most common non-dermal female-specific cancer type, and narrowly the most common cancer type across both sexes [<xref ref-type="bibr" rid="B29">29</xref>]. Of all sub-types, invasive ductal carcinoma (IDC) is the most common and most severe, accounting for roughly 80% of all breast cancers in women [<xref ref-type="bibr" rid="B30">30</xref>]. While previous authors have used spatial transcriptomics to study IDC samples relative to ductal carcinoma in situ (DCIS) samples [<xref ref-type="bibr" rid="B31">31</xref>], IDC has yet to be studied through the lens of community structure due to the lack of computational tools available for performing ACC with HST data.</p>
<p>To illustrate ACC in the tumor microenvironment, we applied BANYAN to a publicly available IDC sample sequenced with the 10 &#x000D7; Visium platform [<xref ref-type="bibr" rid="B32">32</xref>]. We identified five spatially distinct cell spot sub-populations (<xref ref-type="fig" rid="F4">Figure 4A</xref>), and then identified community structure by computing posterior estimates of within and between-community connectivity parameters, as displayed in <xref ref-type="fig" rid="F4">Figures 4B</xref>, <xref ref-type="fig" rid="F4">C</xref>, respectively. Finally, to interpret each sub-population in terms of IDC biology, we computed the most differentially expressed genes between each sub-population and all others using the Wilcoxon rank-sum test implemented in the Seurat package (details in <xref ref-type="supplementary-material" rid="SM1">Supplementary material</xref>) (<xref ref-type="fig" rid="F4">Figure 4D</xref>). <xref ref-type="fig" rid="F4">Figure 4D</xref> displays a clear block structure in the expression of sub-population marker genes, indicating a strong community structure signal in the data. When considered together with their spatial distribution (<xref ref-type="supplementary-material" rid="SM1">Supplementary Figure S6</xref>), these marker genes can be used to obtain many interesting biological insights regarding the community structure of the IDC sample. For instance, the <italic>S100A11</italic> gene, a marker for sub-population 1, is a diagnostic marker in breast cancers [<xref ref-type="bibr" rid="B33">33</xref>] and has been implicated in aggressive tumor progression [<xref ref-type="bibr" rid="B34">34</xref>]. Further, <italic>KRT8</italic> is used to differentiate aggressive grades of IDCs [<xref ref-type="bibr" rid="B35">35</xref>]. While outside of the context of IDCs, <italic>DEGS2</italic> has been shown to play a role in the invasion and metastasis of colorectal cancer [<xref ref-type="bibr" rid="B36">36</xref>]. Taken together, these marker genes suggest that sub-population 1 contains a relatively high abundance of aggressive and invasive cancer cell types. On the other hand, sub-population 2 featured marker genes such as <italic>MALAT1</italic> that are associated with tumor suppressive behaviors in IDCs [<xref ref-type="bibr" rid="B37">37</xref>]. Another marker gene for sub-population 2, <italic>CCDC80</italic>, has been linked with tumor suppressive functions, albeit not in the context of IDCs [<xref ref-type="bibr" rid="B38">38</xref>].</p>
<fig id="F4" position="float">
<label>Figure 4</label>
<caption><p>Community structure in invasive ductal carcinoma. <bold>(A)</bold> Inferred cell spot sub-population labels from BANYAN. <bold>(B)</bold> Within-community connectivity parameters reflect the homogeneity of sub-populations. Higher connectivity values reflect higher homogeneity within sub-populations. <bold>(C)</bold> Between-community connectivity parameters reflect the relative similarity of cell spots between sub-populations. Higher connectivity values reflect more similarity between sub-populations. <bold>(D)</bold> Normalized expression of differentially expressed sub-population markers genes.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fams-10-1403901-g0004.tif"/>
</fig>
<p>Given these brief characterizations of sub-populations 1 and 2 available from the existing literature, we may hypothesize that these groups of cell spots are in some sense opposed in terms of their role within the tumor based on their transcriptional profiles. Indeed, these sub-populations also reside spatially at opposite ends of the tumor slice. We may investigate the similarity or dissimilarity of these sub-populations 1 and 2 using the between-community connectivity parameters presented in <xref ref-type="fig" rid="F4">Figure 4C</xref>. We find that the estimate of this parameter is near zero [as evidenced by the 95% credible for community pair (1,2) in <xref ref-type="fig" rid="F4">Figure 4C</xref>], supporting our hypothesized dissimilarity between sub-populations 1 and 2. In fact, sub-population 1 featured very low between-community connectivity with all other sub-populations besides sub-population 4 [e.g., significantly higher connectivity was featured between sub-populations pairs (1,4) than (1,2) as shown in <xref ref-type="supplementary-material" rid="SM1">Supplementary Figure S7</xref>], which occupies a heterogeneous &#x0201C;background&#x0201D; position in the spatial landscape of the tissue sample (<xref ref-type="fig" rid="F4">Figure 4A</xref>) and therefore featured relatively high connectivity with all other communities. This spatial heterogeneity is accompanied by relatively low within-community connectivity (<xref ref-type="fig" rid="F4">Figure 4B</xref>), which indicates that spot-spot similarities are less common between cell spots in sub-population 4 than in other sub-populations. In <xref ref-type="fig" rid="F4">Figure 4D</xref>, it can be seen that many of the marker genes for sub-population 2 are shared by sub-population 4, including <italic>MALAT1</italic>, suggesting a similarity between these two sub-populations in terms of transcriptional profiles. In addition to the marker genes shared with sub-population 2, sub-population 4 features several of its own distinct marker genes, namely the immunoglobulin heavy chain-encoding RNAs <italic>IGHG1</italic> and <italic>IGHG3</italic>. These genes themselves have been shown to feature tumor suppressive tendencies via promotion of B cell-specific immunoglobulin [<xref ref-type="bibr" rid="B39">39</xref>], and have been associated with increased patient survival [<xref ref-type="bibr" rid="B40">40</xref>]. This observation of functional similarity between sub-populations 2 and 4 is validated by <xref ref-type="fig" rid="F4">Figure 4C</xref>, which clearly shows the highest estimated between-community connectivity in the data occurring between sub-populations 2 and 4. Taken together, these observations may lead us to reason that the sub-population 1 vs. 2 dynamic described previously is linked via the more heterogeneous yet still tumor suppressive-like sub-population 4. While these observations would require further experimental validation to confirm, they showcase the unique ability of BANYAN to describe community structure in the data.</p>
</sec>
<sec>
<title>3.4 Discovering spatial niches in human non-small cell lung cancer tissues</title>
<p>Next, we applied BANYAN to public data from the NanoString CosMx Spatial Molecular Imager (SMI) platform [<xref ref-type="bibr" rid="B41">41</xref>]. The original dataset consists of measurements of eight samples from five non-small-cell lung cancer (NSCLC) formalin-fixed paraffin-embedded (FFPE) tissues, with a total of 800,327 cells. Here we used one of eight samples (lung 5, replicate 1) for the illustration purpose. We further extracted cells corresponding to basal, macrophage, CD4<sup>&#x0002B;</sup> T, and CD8<sup>&#x0002B;</sup> T cells types based on the annotation using the Azimuth Healthy Human Lung reference [<xref ref-type="bibr" rid="B14">14</xref>, <xref ref-type="bibr" rid="B42">42</xref>]. Finally, we randomly downsampled the original data to 8,000 cells to aid in readability and allow for more rapid MCMC convergence.</p>
<p>Using BANYAN, we identified four sub-populations (<xref ref-type="fig" rid="F5">Figure 5A</xref>), investigated the marker genes for each sub-population (<xref ref-type="fig" rid="F5">Figure 5B</xref>), and examined the within- and between-community connectivity (<xref ref-type="fig" rid="F5">Figures 5C</xref>, <xref ref-type="fig" rid="F5">D</xref>). The identified four sub-populations closely matched the spatially resolved neighborhood niches reported in the previous literature [<xref ref-type="bibr" rid="B43">43</xref>]. Each of BANYAN sub-populations 1 to 4 mainly correspond to tumor cells, myeloid-enriched stroma cells, lymphoid structures, and stroma cells, respectively. The spatial distribution of markers for each sub-population confirmed this correspondence. For instance, <italic>KRT17</italic> is a specific marker for basal cells and commonly used diagnostic marker for tumors [<xref ref-type="bibr" rid="B44">44</xref>], and it is highly expressed in sub-population 1. <italic>C1QA, C1QB</italic>, and <italic>C1QC</italic> are markers for macrophages [<xref ref-type="bibr" rid="B45">45</xref>] (macrophages are myeloid lineage cells [<xref ref-type="bibr" rid="B46">46</xref>]), and they are significantly highly expressed in sub-population 2. <italic>IL7R</italic> is a lymphoid-associated gene and we observed its over-expression in sub-population 3.</p>
<fig id="F5" position="float">
<label>Figure 5</label>
<caption><p>Community structure in human non-small-cell lung cancer tissue. <bold>(A)</bold> Inferred sub-populations from BANYAN. <bold>(B)</bold> Spatial plots for marker genes for each sub-population. <bold>(C)</bold> Within-community connectivity between cells belonging to each sub-population. <bold>(D)</bold> Between-community connectivity between cell sub-populations.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fams-10-1403901-g0005.tif"/>
</fig>
<p>While examining these sub-populations, we found that the sub-population 4 (stroma cells) is more heterogeneous than the other sub-populations. It consists of all four cell types and each cell type constitutes a fair proportion of the sub-population, while other sub-populations are mostly dominated by only one cell type. This heterogeneity differences among sub-populations may further explain the within-community connectivity: sub-population 3 is dominated by CD4<sup>&#x0002B;</sup> and CD8<sup>&#x0002B;</sup> T cells (proportion around 90%) and has the highest within-community connectivity. Likewise, nearly 81% of sub-population 2 are macrophages, potentially explaining its second-highest within-community connectivity. For sub-population 1, 99% of the cells are tumor cells, which themselves display high heterogeneity. In the case of between-community connectivity, as before, the observations may be mainly explained by spatial adjacency: sub-population 4 neighbors with all the other sub-populations and the connectivity involved in this sub-population are high [e.g., the (2,4), (3,4) and (1,4) pairs].</p></sec>
</sec>
<sec sec-type="discussion" id="s4">
<title>4 Discussion</title>
<p>We have proposed BANYAN: a network-based statistical framework for the analysis of community connectivity in HST data. In our simulation study, we validate BANYAN&#x00027;s ability to recover the community connectivity structure, even in the case of relatively low SNR, by considering both gene expression similarity and spatial proximity. We applied BANYAN to human melanoma brain metastases, human breast cancer, and human lung cancer, to illustrate its utility in applied settings. In the human melanoma brain metastasis case study, within-community connectivity parameters indicated increasing within-community heterogeneity as we move from outside to within the tumor. In addition, between-community connectivity parameters indicated a higher degree of inter-connectivity between blood, immune, and tumor-adjacent subpopulations, compared to those associated with the tumor region. Besides, we found interesting relationships between community WCC/BCC and TCR repertoire, which indicates that ACC holds the potential to uncover cellular dynamics under the setting of TME. In the breast cancer case study, we found a strong community structure, with sub-populations marked by both invasive cancer and cancer-suppressive marker genes. Using community structure parameters, we also identified an intermediate sub-population between these two. In the human-small-cell lung cancer case study, we observe the relevance of within-community connectivity with the heterogeneity of each cell spot cluster, as illustrated with the stroma cell sub-population.</p>
<p>There are several ways our work may be extended. First, often the SBM is refined to accommodate heterogeneous degree distributions among nodes, i.e., <italic>degree correction</italic> [<xref ref-type="bibr" rid="B47">47</xref>]. By making this methodological extension to the MLSBM at the core of BANYAN, one could relax our assumption that each cell spot features the same number of neighbors and thereby allow for certain cells spots to feature more connections to the rest of the tissue than other cell spots, such as those on the periphery of the tissue sample. Learning the degree of each cell spot would then inform the detection of highly connected &#x0201C;hub&#x0201D; regions, or weakly connected &#x0201C;satellite&#x0201D; regions of a tissue sample. Second, it is possible to allow gene expression and spatial information to be weighed in a data-adaptive manner, although tuning of appropriate weights would be necessary. Third, another extension could be to relax the assumption that gene expression and spatial location layers are governed by common community structure parameters, and instead allow for layer-specific interpretations of community structure. Fourth, the inherent complexity of network data structures leads to a heavy computational burden for large HST experiments. While we implement our proposed MCMC sampling algorithm using efficient <monospace>Rcpp</monospace> routines, BANYAN still requires significantly more computational time than non-network statistical methods [<xref ref-type="bibr" rid="B7">7</xref>, <xref ref-type="bibr" rid="B8">8</xref>]. Further optimization would help to reduce the computational burden of community connectivity analysis. Finally, while BANYAN provides the first statistical framework for quantifying community connectivity structure in HST data, further extensions could be made to link BANYAN with methods for predicting cell-cell interactions using data such as ligand-receptor pair status of cells. By doing so, one could refine the general notion of cell spot connectivity to cell spot interaction, which is of major interest in HST data analysis. In this sense, BANYAN establishes a promising statistical framework that may be extended to a wide range of analyses focused on investigating the interactive nature of HST data.</p></sec>
<sec sec-type="data-availability" id="s5">
<title>Data availability statement</title>
<p>Publicly available datasets were analyzed in this study. This data can be found here: human melanoma brain metastasis data (<ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE179572">https://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE179572</ext-link>), invasive ductal carcinoma data (<ext-link ext-link-type="uri" xlink:href="https://support.10xgenomics.com/spatial-geneexpression/datasets/1.0.0/V1_Breast_Cancer_Block_A_Section_1">https://support.10xgenomics.com/spatial-geneexpression/datasets/1.0.0/V1_Breast_Cancer_Block_A_Section_1</ext-link>), and human non-small cell lung cancer CosMx data (<ext-link ext-link-type="uri" xlink:href="https://nanostring.com/products/cosmx-spatialmolecular-imager/nsclc-ffpe-dataset/">https://nanostring.com/products/cosmx-spatialmolecular-imager/nsclc-ffpe-dataset/</ext-link>). The proposed approach was implemented as an open-source R package &#x0201C;banyan&#x0201D; and it is publicly available at <ext-link ext-link-type="uri" xlink:href="https://github.com/dongjunchung/banyan">https://github.com/dongjunchung/banyan</ext-link>.</p></sec>
<sec sec-type="author-contributions" id="s6">
<title>Author contributions</title>
<p>JX: Conceptualization, Data curation, Formal analysis, Investigation, Methodology, Validation, Visualization, Writing &#x02013; original draft, Writing &#x02013; review &#x00026; editing. KJ: Conceptualization, Formal analysis, Investigation, Methodology, Visualization, Writing &#x02013; original draft, Writing &#x02013; review &#x00026; editing, Validation. CA: Conceptualization, Data curation, Formal analysis, Investigation, Methodology, Software, Visualization, Writing &#x02013; original draft, Writing &#x02013; review &#x00026; editing, Validation. YC: Conceptualization, Data curation, Formal analysis, Investigation, Methodology, Validation, Visualization, Writing &#x02013; original draft, Writing &#x02013; review &#x00026; editing. SP: Investigation, Methodology, Writing &#x02013; original draft, Writing &#x02013; review &#x00026; editing. ZL: Investigation, Resources, Supervision, Writing &#x02013; original draft, Writing &#x02013; review &#x00026; editing. QM: Conceptualization, Funding acquisition, Investigation, Methodology, Project administration, Resources, Supervision, Writing &#x02013; original draft, Writing &#x02013; review &#x00026; editing. DC: Conceptualization, Funding acquisition, Investigation, Methodology, Project administration, Resources, Supervision, Writing &#x02013; original draft, Writing &#x02013; review &#x00026; editing.</p></sec>
</body>
<back>
<sec sec-type="funding-information" id="s7">
<title>Funding</title>
<p>The author(s) declare that financial support was received for the research, authorship, and/or publication of this article. This work was supported in part by the NIH/NHGRI grant R21-HG012482, NIH/NIGMS grants R01-GM122078 and R01-GM131399, NIH/NIDA grant U01-DA045300, NIH/NIA grant U54-AG075931, and NSF grant NSF1945971.</p>
</sec>
<sec sec-type="COI-statement" id="conf1">
<title>Conflict of interest</title>
<p>CA was employed by Eli Lilly and Company. The remaining authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s8">
<title>Publisher&#x00027;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec><sec sec-type="supplementary-material" id="s9">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fams.2024.1403901/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fams.2024.1403901/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Data_Sheet_1.PDF" id="SM1" mimetype="application/pdf" xmlns:xlink="http://www.w3.org/1999/xlink"/></sec>
<ref-list>
<title>References</title>
<ref id="B1">
<label>1.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Asp</surname> <given-names>M</given-names></name> <name><surname>Bergenstrahle</surname> <given-names>J</given-names></name> <name><surname>Lundeberg</surname> <given-names>J</given-names></name></person-group>. <article-title>Spatially resolved transcriptomes&#x00027; next generation tools for tissue exploration</article-title>. <source>BioEssays</source>. (<year>2020</year>) <volume>42</volume>:<fpage>1900221</fpage>. <pub-id pub-id-type="doi">10.1002/bies.201900221</pub-id><pub-id pub-id-type="pmid">32363691</pub-id></citation></ref>
<ref id="B2">
<label>2.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chang</surname> <given-names>Y</given-names></name> <name><surname>He</surname> <given-names>F</given-names></name> <name><surname>Wang</surname> <given-names>J</given-names></name> <name><surname>Chen</surname> <given-names>S</given-names></name> <name><surname>Li</surname> <given-names>J</given-names></name> <name><surname>Liu</surname> <given-names>J</given-names></name> <etal/></person-group>. <article-title>Define and visualize pathological architectures of human tissues from spatially resolved transcriptomics using deep learning</article-title>. <source>Comput Struct Biotechnol J</source>. (<year>2022</year>) <volume>20</volume>:<fpage>4600</fpage>&#x02013;<lpage>17</lpage>. <pub-id pub-id-type="doi">10.1016/j.csbj.2022.08.029</pub-id><pub-id pub-id-type="pmid">36090815</pub-id></citation></ref>
<ref id="B3">
<label>3.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hu</surname> <given-names>J</given-names></name> <name><surname>Li</surname> <given-names>X</given-names></name> <name><surname>Coleman</surname> <given-names>K</given-names></name> <name><surname>Schroeder</surname> <given-names>A</given-names></name> <name><surname>Ma</surname> <given-names>N</given-names></name> <name><surname>Irwin</surname> <given-names>DJ</given-names></name> <etal/></person-group>. <article-title>SpaGCN: integrating gene expression, spatial location and histology to identify spatial domains and spatially variable genes by graph convolutional network</article-title>. <source>Nat Methods</source>. (<year>2021</year>) <volume>18</volume>:<fpage>1342</fpage>&#x02013;<lpage>51</lpage>. <pub-id pub-id-type="doi">10.1038/s41592-021-01255-8</pub-id><pub-id pub-id-type="pmid">34711970</pub-id></citation></ref>
<ref id="B4">
<label>4.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Canozo</surname> <given-names>FJG</given-names></name> <name><surname>Zuo</surname> <given-names>Z</given-names></name> <name><surname>Martin</surname> <given-names>JF</given-names></name> <name><surname>Samee</surname> <given-names>MAH</given-names></name></person-group>. <article-title>Cell-type modeling in spatial transcriptomics data elucidates spatially variable colocalization and communication between cell-types in mouse brain</article-title>. <source>Cell Syst</source>. (<year>2022</year>) <volume>13</volume>:<fpage>58</fpage>&#x02013;<lpage>70</lpage>. <pub-id pub-id-type="doi">10.1016/j.cels.2021.09.004</pub-id><pub-id pub-id-type="pmid">34626538</pub-id></citation></ref>
<ref id="B5">
<label>5.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dries</surname> <given-names>R</given-names></name> <name><surname>Zhu</surname> <given-names>Q</given-names></name> <name><surname>Dong</surname> <given-names>R</given-names></name> <name><surname>Eng CHL Li</surname> <given-names>H</given-names></name> <name><surname>Liu</surname> <given-names>K</given-names></name> <etal/></person-group>. <article-title>Giotto: a toolbox for integrative analysis and visualization of spatial expression data</article-title>. <source>Genome Biol</source>. (<year>2021</year>) <volume>22</volume>:<fpage>1</fpage>&#x02013;<lpage>31</lpage>. <pub-id pub-id-type="doi">10.1186/s13059-021-02286-2</pub-id><pub-id pub-id-type="pmid">33685491</pub-id></citation></ref>
<ref id="B6">
<label>6.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pham</surname> <given-names>D</given-names></name> <name><surname>Tan</surname> <given-names>X</given-names></name> <name><surname>Balderson</surname> <given-names>B</given-names></name> <name><surname>Xu</surname> <given-names>J</given-names></name> <name><surname>Grice</surname> <given-names>LF</given-names></name> <name><surname>Yoon</surname> <given-names>S</given-names></name> <etal/></person-group>. <article-title>Robust mapping of spatiotemporal trajectories and cell-cell interactions in healthy and diseased tissues</article-title>. <source>Nat Commun</source>. (<year>2023</year>) <volume>14</volume>:<fpage>7739</fpage>. <pub-id pub-id-type="doi">10.1038/s41467-023-43120-6</pub-id><pub-id pub-id-type="pmid">38007580</pub-id></citation></ref>
<ref id="B7">
<label>7.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhao</surname> <given-names>E</given-names></name> <name><surname>Stone</surname> <given-names>MR</given-names></name> <name><surname>Ren</surname> <given-names>X</given-names></name> <name><surname>Pulliam</surname> <given-names>T</given-names></name> <name><surname>Nghiem</surname> <given-names>P</given-names></name> <name><surname>Bielas</surname> <given-names>JH</given-names></name> <etal/></person-group>. <article-title>Spatial transcriptomics at subspot resolution with BayesSpace</article-title>. <source>Nat Biotechnol</source>. (<year>2021</year>) <volume>39</volume>:<fpage>1375</fpage>&#x02013;<lpage>84</lpage>. <pub-id pub-id-type="doi">10.1038/s41587-021-00935-2</pub-id><pub-id pub-id-type="pmid">34083791</pub-id></citation></ref>
<ref id="B8">
<label>8.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Allen</surname> <given-names>C</given-names></name> <name><surname>Chang</surname> <given-names>Y</given-names></name> <name><surname>Neelon</surname> <given-names>B</given-names></name> <name><surname>Chang</surname> <given-names>W</given-names></name> <name><surname>Kim</surname> <given-names>HJ</given-names></name> <name><surname>Li</surname> <given-names>Z</given-names></name> <etal/></person-group>. <article-title>A Bayesian multivariate mixture model for spatial transcriptomics data</article-title>. <source>Biometrics</source>. (<year>2023</year>) <volume>79</volume>:<fpage>1775</fpage>&#x02013;<lpage>87</lpage>. <pub-id pub-id-type="doi">10.1111/biom.13727</pub-id><pub-id pub-id-type="pmid">35895854</pub-id></citation></ref>
<ref id="B9">
<label>9.</label>
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Barresi</surname> <given-names>MJF</given-names></name> <name><surname>Gilbert</surname> <given-names>SF</given-names></name></person-group>. <source>Developmental Biology, Vol. 12</source>. <publisher-loc>Sunderland, MA</publisher-loc>: <publisher-name>Sinauer Associates</publisher-name> (<year>2019</year>).</citation>
</ref>
<ref id="B10">
<label>10.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Armingol</surname> <given-names>E</given-names></name> <name><surname>Officer</surname> <given-names>A</given-names></name> <name><surname>Harismendy</surname> <given-names>O</given-names></name> <name><surname>Lewis</surname> <given-names>NE</given-names></name></person-group>. <article-title>Deciphering cell-cell interactions and communication from gene expression</article-title>. <source>Nat Rev Genet</source>. (<year>2021</year>) <volume>22</volume>:<fpage>71</fpage>&#x02013;<lpage>88</lpage>. <pub-id pub-id-type="doi">10.1038/s41576-020-00292-x</pub-id><pub-id pub-id-type="pmid">33168968</pub-id></citation></ref>
<ref id="B11">
<label>11.</label>
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Guzzi</surname> <given-names>PH</given-names></name> <name><surname>Roy</surname> <given-names>S</given-names></name></person-group>. <source>Biological Network Analysis: Trends, Approaches, Graph Theory, and Algorithms</source>. <publisher-loc>Amsterdam</publisher-loc>: <publisher-name>Elsevier</publisher-name> (<year>2020</year>). <pub-id pub-id-type="doi">10.1016/B978-0-12-819350-1.00011-6</pub-id></citation>
</ref>
<ref id="B12">
<label>12.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Nowicki</surname> <given-names>K</given-names></name> <name><surname>Snijders</surname> <given-names>TAB</given-names></name></person-group>. <article-title>Estimation and prediction for stochastic blockstructures</article-title>. <source>J Am Stat Assoc</source>. (<year>2001</year>) <volume>96</volume>:<fpage>1077</fpage>&#x02013;<lpage>87</lpage>. <pub-id pub-id-type="doi">10.1198/016214501753208735</pub-id><pub-id pub-id-type="pmid">12611515</pub-id></citation></ref>
<ref id="B13">
<label>13.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Valles-Catala</surname> <given-names>T</given-names></name> <name><surname>Massucci</surname> <given-names>FA</given-names></name> <name><surname>Guimera</surname> <given-names>R</given-names></name> <name><surname>Sales-Pardo</surname> <given-names>M</given-names></name></person-group>. <article-title>Multilayer stochastic block models reveal the multilayer structure of complex networks</article-title>. <source>Phys Rev X</source>. (<year>2016</year>) <volume>6</volume>:<fpage>011036</fpage>. <pub-id pub-id-type="doi">10.1103/PhysRevX.6.011036</pub-id><pub-id pub-id-type="pmid">33044929</pub-id></citation></ref>
<ref id="B14">
<label>14.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hao</surname> <given-names>Y</given-names></name> <name><surname>Hao</surname> <given-names>S</given-names></name> <name><surname>Andersen-Nissen</surname> <given-names>E</given-names></name> <name><surname>Mauck</surname> <given-names>WM</given-names></name> <name><surname>Zheng</surname> <given-names>S</given-names></name> <name><surname>Butler</surname> <given-names>A</given-names></name> <etal/></person-group>. <article-title>Integrated analysis of multimodal single-cell data</article-title>. <source>Cell</source>. (<year>2021</year>) <volume>184</volume>:<fpage>3573</fpage>&#x02013;<lpage>87</lpage>. <pub-id pub-id-type="doi">10.1016/j.cell.2021.04.048</pub-id><pub-id pub-id-type="pmid">34062119</pub-id></citation></ref>
<ref id="B15">
<label>15.</label>
<citation citation-type="web"><person-group person-group-type="author"><name><surname>Seurat</surname> <given-names>- Guided Clustering Tutoria</given-names></name></person-group>. (<year>2021</year>). Available online at: <ext-link ext-link-type="uri" xlink:href="https://satijalab.org/seurat/articles/pbmc3k_tutorial.html">https://satijalab.org/seurat/articles/pbmc3k_tutorial.html</ext-link> (accessed May 27, 2021).</citation>
</ref>
<ref id="B16">
<label>16.</label>
<citation citation-type="web"><person-group person-group-type="author"><collab>Analysis visualization and and integration of spatial datasets with Seurat</collab></person-group>. (<year>2021</year>). Available online at: <ext-link ext-link-type="uri" xlink:href="https://satijalab.org/seurat/articles/spatial_vignette.html&#x00023;acknowledgments-1">https://satijalab.org/seurat/articles/spatial_vignette.html&#x00023;acknowledgments-1</ext-link> (accessed May 27, 2021).</citation>
</ref>
<ref id="B17">
<label>17.</label>
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Stork</surname> <given-names>DG</given-names></name> <name><surname>Duda</surname> <given-names>RO</given-names></name> <name><surname>Hart</surname> <given-names>PE</given-names></name> <name><surname>Stork</surname> <given-names>D</given-names></name></person-group>. <source>Pattern Classification</source>. <publisher-loc>Hoboken, NJ</publisher-loc>: <publisher-name>A Wiley-Interscience Publication</publisher-name> (<year>2001</year>).</citation>
</ref>
<ref id="B18">
<label>18.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Snijders</surname> <given-names>TA</given-names></name> <name><surname>Nowicki</surname> <given-names>K</given-names></name></person-group>. <article-title>Estimation and prediction for stochastic blockmodels for graphs with latent block structure</article-title>. <source>J Classif</source> . (<year>1997</year>) <volume>14</volume>:<fpage>75</fpage>&#x02013;<lpage>100</lpage>. <pub-id pub-id-type="doi">10.1007/s003579900004</pub-id></citation>
</ref>
<ref id="B19">
<label>19.</label>
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Gelman</surname> <given-names>A</given-names></name> <name><surname>Carlin</surname> <given-names>JB</given-names></name> <name><surname>Stern</surname> <given-names>HS</given-names></name> <name><surname>Dunson</surname> <given-names>DB</given-names></name> <name><surname>Vehtari</surname> <given-names>A</given-names></name> <name><surname>Rubin</surname> <given-names>DB</given-names></name></person-group>. <source>Bayesian Data Analysis</source>. <publisher-loc>Boca Raton, FL</publisher-loc>: <publisher-name>CRC Press</publisher-name> (<year>2013</year>). <pub-id pub-id-type="doi">10.1201/b16018</pub-id><pub-id pub-id-type="pmid">38367612</pub-id></citation></ref>
<ref id="B20">
<label>20.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Blondel</surname> <given-names>VD</given-names></name> <name><surname>Guillaume</surname> <given-names>JL</given-names></name> <name><surname>Lambiotte</surname> <given-names>R</given-names></name> <name><surname>Lefebvre</surname> <given-names>E</given-names></name></person-group>. <article-title>Fast unfolding of communities in large networks</article-title>. <source>J Stat Mech Theor Exp</source>. (<year>2008</year>) <volume>2008</volume>:<fpage>P10008</fpage>. <pub-id pub-id-type="doi">10.1088/1742-5468/2008/10/P10008</pub-id></citation>
</ref>
<ref id="B21">
<label>21.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Papastamoulis</surname> <given-names>P</given-names></name></person-group>. <article-title>label</article-title>.switching: an R Package for dealing with the label switching problem in MCMC outputs. <source>J Stat Softw</source>. (<year>2016</year>) <volume>69</volume>:<fpage>1</fpage>&#x02013;<lpage>24</lpage>. <pub-id pub-id-type="doi">10.18637/jss.v069.c01</pub-id></citation>
</ref>
<ref id="B22">
<label>22.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Peng</surname> <given-names>L</given-names></name> <name><surname>Carvalho</surname> <given-names>L</given-names></name></person-group>. <article-title>Bayesian degree-corrected stochastic blockmodels for community detection</article-title>. <source>Electron J Stat</source>. (<year>2016</year>) <volume>10</volume>:<fpage>2746</fpage>&#x02013;<lpage>79</lpage>. <pub-id pub-id-type="doi">10.1214/16-EJS1163</pub-id></citation>
</ref>
<ref id="B23">
<label>23.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Stuart</surname> <given-names>T</given-names></name> <name><surname>Butler</surname> <given-names>A</given-names></name> <name><surname>Hoffman</surname> <given-names>P</given-names></name> <name><surname>Hafemeister</surname> <given-names>C</given-names></name> <name><surname>Papalexi</surname> <given-names>E</given-names></name> <name><surname>Mauck III</surname> <given-names>WM</given-names></name> <etal/></person-group>. <article-title>Comprehensive integration of single-cell data</article-title>. <source>Cell</source>. (<year>2019</year>) <volume>177</volume>:<fpage>1888</fpage>&#x02013;<lpage>902</lpage>. <pub-id pub-id-type="doi">10.1016/j.cell.2019.05.031</pub-id><pub-id pub-id-type="pmid">31178118</pub-id></citation></ref>
<ref id="B24">
<label>24.</label>
<citation citation-type="web"><person-group person-group-type="author"><name><surname>x</surname> <given-names>Genomics</given-names></name></person-group>. <source>Mouse Brain Serial Section 1 (Sagittal-Anterior); Spatial Gene Expression Dataset by Space Ranger 1.0.0</source>. (<year>2019</year>). Available online at: <ext-link ext-link-type="uri" xlink:href="https://support.10xgenomics.com/spatial-gene-expression/datasets/1.0.0/V1_Mouse_Brain_Sagittal_Anterior">https://support.10xgenomics.com/spatial-gene-expression/datasets/1.0.0/V1_Mouse_Brain_Sagittal_Anterior</ext-link> (accessed Septemper 6, 2021).</citation>
</ref>
<ref id="B25">
<label>25.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Suh</surname> <given-names>JH</given-names></name> <name><surname>Kotecha</surname> <given-names>R</given-names></name> <name><surname>Chao</surname> <given-names>ST</given-names></name> <name><surname>Ahluwalia</surname> <given-names>MS</given-names></name> <name><surname>Sahgal</surname> <given-names>A</given-names></name> <name><surname>Chang</surname> <given-names>EL</given-names></name></person-group>. <article-title>Current approaches to the management of brain metastases</article-title>. <source>Nat Rev Clin Oncol</source>. (<year>2020</year>) <volume>17</volume>:<fpage>279</fpage>&#x02013;<lpage>99</lpage>. <pub-id pub-id-type="doi">10.1038/s41571-019-0320-3</pub-id><pub-id pub-id-type="pmid">32080373</pub-id></citation></ref>
<ref id="B26">
<label>26.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sperduto</surname> <given-names>PW</given-names></name> <name><surname>Mesko</surname> <given-names>S</given-names></name> <name><surname>Li</surname> <given-names>J</given-names></name> <name><surname>Cagney</surname> <given-names>D</given-names></name> <name><surname>Aizer</surname> <given-names>A</given-names></name> <name><surname>Lin</surname> <given-names>NU</given-names></name> <etal/></person-group>. <article-title>Survival in patients with brain metastases: summary report on the updated diagnosis-specific graded prognostic assessment and definition of the eligibility quotient</article-title>. <source>J Clin Oncol</source>. (<year>2020</year>) <volume>38</volume>:<fpage>3773</fpage>. <pub-id pub-id-type="doi">10.1200/JCO.20.01255</pub-id><pub-id pub-id-type="pmid">32931399</pub-id></citation></ref>
<ref id="B27">
<label>27.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Di Giacomo</surname> <given-names>AM</given-names></name> <name><surname>Valente</surname> <given-names>M</given-names></name> <name><surname>Cerase</surname> <given-names>A</given-names></name> <name><surname>Lofiego</surname> <given-names>MF</given-names></name> <name><surname>Piazzini</surname> <given-names>F</given-names></name> <name><surname>Calabr&#x000F2;</surname> <given-names>L</given-names></name> <etal/></person-group>. <article-title>Immunotherapy of brain metastases: breaking a &#x0201C;dogma&#x0201D;</article-title>. <source>J Exp Clin Cancer Res</source>. (<year>2019</year>) <volume>38</volume>:<fpage>1</fpage>&#x02013;<lpage>10</lpage>. <pub-id pub-id-type="doi">10.1186/s13046-019-1426-2</pub-id><pub-id pub-id-type="pmid">31623643</pub-id></citation></ref>
<ref id="B28">
<label>28.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sudmeier</surname> <given-names>LJ</given-names></name> <name><surname>Hoang</surname> <given-names>KB</given-names></name> <name><surname>Nduom</surname> <given-names>EK</given-names></name> <name><surname>Wieland</surname> <given-names>A</given-names></name> <name><surname>Neill</surname> <given-names>SG</given-names></name> <name><surname>Schniederjan</surname> <given-names>MJ</given-names></name> <etal/></person-group>. <article-title>Distinct phenotypic states and spatial distribution of CD8&#x0002B; T cell clonotypes in human brain metastases</article-title>. <source>Cell Rep Med</source>. (<year>2022</year>) <volume>3</volume>:<fpage>100620</fpage>. <pub-id pub-id-type="doi">10.1016/j.xcrm.2022.100620</pub-id><pub-id pub-id-type="pmid">35584630</pub-id></citation></ref>
<ref id="B29">
<label>29.</label>
<citation citation-type="web"><person-group person-group-type="author"><collab>WCRF</collab></person-group>. <source>Worldwide cancer data</source>. (<year>2020</year>). Available online at: <ext-link ext-link-type="uri" xlink:href="https://www.wcrf.org/dietandcancer/worldwide-cancer-data/">https://www.wcrf.org/dietandcancer/worldwide-cancer-data/</ext-link> (accessed January 4, 2022).</citation>
</ref>
<ref id="B30">
<label>30.</label>
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Harris</surname> <given-names>JR</given-names></name> <name><surname>Lippman</surname> <given-names>ME</given-names></name> <name><surname>Osborne</surname> <given-names>CK</given-names></name> <name><surname>Morrow</surname> <given-names>M</given-names></name></person-group>. <source>Diseases of the Breast</source>. <publisher-loc>Philadelphia, PA</publisher-loc>: <publisher-name>Lippincott Williams &#x00026; Wilkins</publisher-name> (<year>2012</year>).</citation>
</ref>
<ref id="B31">
<label>31.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yoosuf</surname> <given-names>N</given-names></name> <name><surname>Navarro</surname> <given-names>JF</given-names></name> <name><surname>Salm&#x000E9;n</surname> <given-names>F</given-names></name> <name><surname>St&#x000E5;hl</surname> <given-names>PL</given-names></name> <name><surname>Daub</surname> <given-names>CO</given-names></name></person-group>. <article-title>Identification and transfer of spatial transcriptomics signatures for cancer diagnosis</article-title>. <source>Breast Cancer Res</source>. (<year>2020</year>) <volume>22</volume>:<fpage>1</fpage>&#x02013;<lpage>10</lpage>. <pub-id pub-id-type="doi">10.1186/s13058-019-1242-9</pub-id><pub-id pub-id-type="pmid">31931856</pub-id></citation></ref>
<ref id="B32">
<label>32.</label>
<citation citation-type="web"><person-group person-group-type="author"><name><surname>x</surname> <given-names>Genomics</given-names></name></person-group>. <source>Human Breast Cancer (Block A Section 1); Spatial Gene Expression Dataset by Space Ranger 1</source>.1.0. (<year>2020</year>). Available online at: <ext-link ext-link-type="uri" xlink:href="https://support.10xgenomics.com/spatial-gene-expression/datasets/1.0.0/V1_Breast_Cancer_Block_A_Section_1">https://support.10xgenomics.com/spatial-gene-expression/datasets/1.0.0/V1_Breast_Cancer_Block_A_Section_1</ext-link> (accessed June 8, 2021).</citation>
</ref>
<ref id="B33">
<label>33.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Liu</surname> <given-names>XG</given-names></name> <name><surname>Wang XP Li</surname> <given-names>WF</given-names></name> <name><surname>Yang</surname> <given-names>S</given-names></name> <name><surname>Zhou</surname> <given-names>X</given-names></name> <name><surname>Li</surname> <given-names>SJ</given-names></name> <etal/></person-group>. <article-title>Ca2&#x0002B;-binding protein S100A11: a novel diagnostic marker for breast carcinoma</article-title>. <source>Oncol Rep</source>. (<year>2010</year>) <volume>23</volume>:<fpage>1301</fpage>&#x02013;<lpage>8</lpage>. <pub-id pub-id-type="doi">10.3892/or_00000764</pub-id><pub-id pub-id-type="pmid">20372844</pub-id></citation></ref>
<ref id="B34">
<label>34.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>McKiernan</surname> <given-names>E</given-names></name> <name><surname>McDermott</surname> <given-names>EW</given-names></name> <name><surname>Evoy</surname> <given-names>D</given-names></name> <name><surname>Crown</surname> <given-names>J</given-names></name> <name><surname>Duffy</surname> <given-names>MJ</given-names></name></person-group>. <article-title>The role of S100 genes in breast cancer progression</article-title>. <source>Tumor Biol</source>. (<year>2011</year>) <volume>32</volume>:<fpage>441</fpage>&#x02013;<lpage>50</lpage>. <pub-id pub-id-type="doi">10.1007/s13277-010-0137-2</pub-id><pub-id pub-id-type="pmid">21153724</pub-id></citation></ref>
<ref id="B35">
<label>35.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Walker</surname> <given-names>LC</given-names></name> <name><surname>Harris</surname> <given-names>GC</given-names></name> <name><surname>Holloway</surname> <given-names>AJ</given-names></name> <name><surname>McKenzie</surname> <given-names>GW</given-names></name> <name><surname>Wells</surname> <given-names>JE</given-names></name> <name><surname>Robinson</surname> <given-names>BA</given-names></name> <etal/></person-group>. <article-title>Cytokeratin KRT8/18 expression differentiates distinct subtypes of grade 3 invasive ductal carcinoma of the breast</article-title>. <source>Cancer Genet Cytogenet</source>. (<year>2007</year>) <volume>178</volume>:<fpage>94</fpage>&#x02013;<lpage>103</lpage>. <pub-id pub-id-type="doi">10.1016/j.cancergencyto.2007.06.002</pub-id><pub-id pub-id-type="pmid">17954264</pub-id></citation></ref>
<ref id="B36">
<label>36.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Guo</surname> <given-names>W</given-names></name> <name><surname>Zhang</surname> <given-names>C</given-names></name> <name><surname>Feng</surname> <given-names>P</given-names></name> <name><surname>Li</surname> <given-names>M</given-names></name> <name><surname>Wang</surname> <given-names>X</given-names></name> <name><surname>Xia</surname> <given-names>Y</given-names></name> <etal/></person-group>. <article-title>M6A methylation of DEGS2, a key ceramide-synthesizing enzyme, is involved in colorectal cancer progression through ceramide synthesis</article-title>. <source>Oncogene</source>. (<year>2021</year>) <volume>40</volume>:<fpage>5913</fpage>&#x02013;<lpage>24</lpage>. <pub-id pub-id-type="doi">10.1038/s41388-021-01987-z</pub-id><pub-id pub-id-type="pmid">34363020</pub-id></citation></ref>
<ref id="B37">
<label>37.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kim</surname> <given-names>J</given-names></name> <name><surname>Piao</surname> <given-names>HL</given-names></name> <name><surname>Kim</surname> <given-names>BJ</given-names></name> <name><surname>Yao</surname> <given-names>F</given-names></name> <name><surname>Han</surname> <given-names>Z</given-names></name> <name><surname>Wang</surname> <given-names>Y</given-names></name> <etal/></person-group>. <article-title>Long noncoding RNA MALAT1 suppresses breast cancer metastasis</article-title>. <source>Nat Genet</source>. (<year>2018</year>) <volume>50</volume>:<fpage>1705</fpage>&#x02013;<lpage>15</lpage>. <pub-id pub-id-type="doi">10.1038/s41588-018-0252-3</pub-id><pub-id pub-id-type="pmid">30349115</pub-id></citation></ref>
<ref id="B38">
<label>38.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ferraro</surname> <given-names>A</given-names></name> <name><surname>Schepis</surname> <given-names>F</given-names></name> <name><surname>Leone</surname> <given-names>V</given-names></name> <name><surname>Federico</surname> <given-names>A</given-names></name> <name><surname>Borbone</surname> <given-names>E</given-names></name> <name><surname>Pallante</surname> <given-names>P</given-names></name> <etal/></person-group>. <article-title>Tumor suppressor role of the CL2/DRO1/CCDC80 gene in thyroid carcinogenesis</article-title>. <source>J Clin Endocrinol Metab</source>. (<year>2013</year>) <volume>98</volume>:<fpage>2834</fpage>&#x02013;<lpage>43</lpage>. <pub-id pub-id-type="doi">10.1210/jc.2012-2926</pub-id><pub-id pub-id-type="pmid">23666966</pub-id></citation></ref>
<ref id="B39">
<label>39.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hsu</surname> <given-names>HM</given-names></name> <name><surname>Chu</surname> <given-names>CM</given-names></name> <name><surname>Chang YJ Yu</surname> <given-names>JC</given-names></name> <name><surname>Chen</surname> <given-names>CT</given-names></name> <name><surname>Jian</surname> <given-names>CE</given-names></name> <etal/></person-group>. <article-title>Six novel immunoglobulin genes as biomarkers for better prognosis in triple-negative breast cancer by gene co-expression network analysis</article-title>. <source>Sci Rep</source>. (<year>2019</year>) <volume>9</volume>:<fpage>1</fpage>&#x02013;<lpage>12</lpage>. <pub-id pub-id-type="doi">10.1038/s41598-019-40826-w</pub-id><pub-id pub-id-type="pmid">30872752</pub-id></citation></ref>
<ref id="B40">
<label>40.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Larsson</surname> <given-names>C</given-names></name> <name><surname>Ehinger</surname> <given-names>A</given-names></name> <name><surname>Winslow</surname> <given-names>S</given-names></name> <name><surname>Leandersson</surname> <given-names>K</given-names></name> <name><surname>Klintman</surname> <given-names>M</given-names></name> <name><surname>Dahl</surname> <given-names>L</given-names></name> <etal/></person-group>. <article-title>Prognostic implications of the expression levels of different immunoglobulin heavy chain-encoding RNAs in early breast cancer</article-title>. <source>NPJ Breast Cancer</source>. (<year>2020</year>) <volume>6</volume>:<fpage>1</fpage>&#x02013;<lpage>13</lpage>. <pub-id pub-id-type="doi">10.1038/s41523-020-0170-2</pub-id><pub-id pub-id-type="pmid">32656317</pub-id></citation></ref>
<ref id="B41">
<label>41.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lewis</surname> <given-names>ZR</given-names></name> <name><surname>Birditt</surname> <given-names>B</given-names></name> <name><surname>Brown</surname> <given-names>E</given-names></name> <name><surname>Chantranuvatana</surname> <given-names>K</given-names></name> <name><surname>Filanoski</surname> <given-names>B</given-names></name> <name><surname>Corless</surname> <given-names>C</given-names></name> <etal/></person-group>. <article-title>Single cell spatial molecular imaging of 76-plex proteins in clinical cancer samples in response to personalized treatment</article-title>. <source>Cancer Res</source>. (<year>2023</year>) 83(7_Supplement):5641. <pub-id pub-id-type="doi">10.1158/1538-7445.AM2023-5641</pub-id></citation>
</ref>
<ref id="B42">
<label>42.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Travaglini</surname> <given-names>KJ</given-names></name> <name><surname>Nabhan</surname> <given-names>AN</given-names></name> <name><surname>Penland</surname> <given-names>L</given-names></name> <name><surname>Sinha</surname> <given-names>R</given-names></name> <name><surname>Gillich</surname> <given-names>A</given-names></name> <name><surname>Sit</surname> <given-names>RV</given-names></name> <etal/></person-group>. <article-title>A molecular cell atlas of the human lung from single-cell RNA sequencing</article-title>. <source>Nature</source>. (<year>2020</year>) <volume>587</volume>:<fpage>619</fpage>&#x02013;<lpage>25</lpage>. <pub-id pub-id-type="doi">10.1038/s41586-020-2922-4</pub-id><pub-id pub-id-type="pmid">33208946</pub-id></citation></ref>
<ref id="B43">
<label>43.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>He</surname> <given-names>S</given-names></name> <name><surname>Bhatt</surname> <given-names>R</given-names></name> <name><surname>Brown</surname> <given-names>C</given-names></name> <name><surname>Brown</surname> <given-names>EA</given-names></name> <name><surname>Buhr</surname> <given-names>DL</given-names></name> <name><surname>Chantranuvatana</surname> <given-names>K</given-names></name> <etal/></person-group>. <article-title>High-plex imaging of RNA and proteins at subcellular resolution in fixed tissue by spatial molecular imaging</article-title>. <source>Nat Biotechnol</source>. (<year>2022</year>) <volume>40</volume>:<fpage>1794</fpage>&#x02013;<lpage>806</lpage>. <pub-id pub-id-type="doi">10.1038/s41587-022-01483-z</pub-id><pub-id pub-id-type="pmid">36203011</pub-id></citation></ref>
<ref id="B44">
<label>44.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>Z</given-names></name> <name><surname>Yang</surname> <given-names>MQ</given-names></name> <name><surname>Lei</surname> <given-names>L</given-names></name> <name><surname>Fei</surname> <given-names>LR</given-names></name> <name><surname>Zheng</surname> <given-names>YW</given-names></name> <name><surname>Huang</surname> <given-names>WJ</given-names></name> <etal/></person-group>. <article-title>Overexpression of KRT17 promotes proliferation and invasion of non-small cell lung cancer and indicates poor prognosis</article-title>. <source>Cancer Manag Res</source>. (<year>2019</year>) <volume>11</volume>:<fpage>7485</fpage>. <pub-id pub-id-type="doi">10.2147/CMAR.S218926</pub-id><pub-id pub-id-type="pmid">31496806</pub-id></citation></ref>
<ref id="B45">
<label>45.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Revel</surname> <given-names>M</given-names></name> <name><surname>Saut&#x000E8;s-Fridman</surname> <given-names>C</given-names></name> <name><surname>Fridman</surname> <given-names>WH</given-names></name> <name><surname>Roumenina</surname> <given-names>LT</given-names></name></person-group>. <article-title>C1q&#x0002B; macrophages: passengers or drivers of cancer progression</article-title>. <source>Trends Cancer</source>. (<year>2022</year>) <volume>8</volume>:<fpage>517</fpage>&#x02013;<lpage>26</lpage>. <pub-id pub-id-type="doi">10.1016/j.trecan.2022.02.006</pub-id><pub-id pub-id-type="pmid">35288093</pub-id></citation></ref>
<ref id="B46">
<label>46.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gabrilovich</surname> <given-names>DI</given-names></name> <name><surname>Ostrand-Rosenberg</surname> <given-names>S</given-names></name> <name><surname>Bronte</surname> <given-names>V</given-names></name></person-group>. <article-title>Coordinated regulation of myeloid cells by tumours</article-title>. <source>Nat Rev Immunol</source>. (<year>2012</year>) <volume>12</volume>:<fpage>253</fpage>&#x02013;<lpage>68</lpage>. <pub-id pub-id-type="doi">10.1038/nri3175</pub-id><pub-id pub-id-type="pmid">22437938</pub-id></citation></ref>
<ref id="B47">
<label>47.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Karrer</surname> <given-names>B</given-names></name> <name><surname>Newman</surname> <given-names>ME</given-names></name></person-group>. <article-title>Stochastic blockmodels and community structure in networks</article-title>. <source>Phys Rev E</source>. (<year>2011</year>) <volume>83</volume>:<fpage>016107</fpage>. <pub-id pub-id-type="doi">10.1103/PhysRevE.83.016107</pub-id><pub-id pub-id-type="pmid">21405744</pub-id></citation></ref>
</ref-list>
</back>
</article>