<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Cell. Infect. Microbiol.</journal-id>
<journal-title>Frontiers in Cellular and Infection Microbiology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Cell. Infect. Microbiol.</abbrev-journal-title>
<issn pub-type="epub">2235-2988</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fcimb.2023.1210807</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Cellular and Infection Microbiology</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Mendelian randomization analysis to investigate the gut microbiome in oral and oropharyngeal cancer</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Zhang</surname>
<given-names>Qihe</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Wang</surname>
<given-names>Huanhuan</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Tian</surname>
<given-names>Yuan</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Li</surname>
<given-names>Jinjie</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
</contrib>
<contrib contrib-type="author" equal-contrib="yes">
<name>
<surname>Xin</surname>
<given-names>Ying</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<xref ref-type="author-notes" rid="fn003">
<sup>&#x2020;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1436368"/>
</contrib>
<contrib contrib-type="author" equal-contrib="yes" corresp="yes">
<name>
<surname>Jiang</surname>
<given-names>Xin</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<xref ref-type="author-notes" rid="fn003">
<sup>&#x2020;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/682950"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Jilin Provincial Key Laboratory of Radiation Oncology &amp; Therapy, The First Hospital of Jilin University, and Key Laboratory of Pathobiology, Ministry of Education, Jilin University</institution>, <addr-line>Changchun</addr-line>, <country>China</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Department of Radiation Oncology, The First Hospital of Jilin University</institution>, <addr-line>Changchun</addr-line>, <country>China</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>NHC Key Laboratory of Radiobiology, School of Public Health, Jilin University</institution>, <addr-line>Changchun</addr-line>, <country>China</country>
</aff>
<aff id="aff4">
<sup>4</sup>
<institution>Key Laboratory of Pathobiology, Ministry of Education, Jilin University</institution>, <addr-line>Changchun</addr-line>, <country>China</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>Edited by: Kaitlin Wade, University of Bristol, United Kingdom</p>
</fn>
<fn fn-type="edited-by">
<p>Reviewed by: Jie Fu, Shanghai Jiao Tong University, China</p>
<p>Fangzheng Wang, Zhejiang Cancer Hospital, China</p>
<p>Tao Tang, Indiana University, United States</p>
</fn>
<fn fn-type="corresp" id="fn001">
<p>*Correspondence: Xin Jiang, <email xlink:href="mailto:jiangx@jlu.edu.cn">jiangx@jlu.edu.cn</email>
</p>
</fn>
<fn fn-type="equal" id="fn003">
<p>&#x2020;These authors have contributed equally to this work</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>04</day>
<month>01</month>
<year>2024</year>
</pub-date>
<pub-date pub-type="collection">
<year>2023</year>
</pub-date>
<volume>13</volume>
<elocation-id>1210807</elocation-id>
<history>
<date date-type="received">
<day>24</day>
<month>04</month>
<year>2023</year>
</date>
<date date-type="accepted">
<day>06</day>
<month>12</month>
<year>2023</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2024 Zhang, Wang, Tian, Li, Xin and Jiang</copyright-statement>
<copyright-year>2024</copyright-year>
<copyright-holder>Zhang, Wang, Tian, Li, Xin and Jiang</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<sec>
<title>Background</title>
<p>Evidence supports an observational association between the gut microbiome and susceptibility to extraintestinal cancers, but the causal relationship of this association remains unclear.</p>
</sec>
<sec>
<title>Methods</title>
<p>To identify the specific causal gut microbiota of oral and oropharyngeal cancer, we performed two-sample Mendelian randomization (MR) analysis of gut microbiota on oral and oropharyngeal cancer using a fixed-effects inverse-variance-weighted model. Gut microbiota across five different taxonomical levels from the MiBioGen genome-wide association study (GWAS) were used as exposures. Oral cancer, oropharyngeal cancer and a combination of the two cancers defined from three separate data sources were used as the outcomes. Odds ratios (ORs) and 95% confidence intervals (CIs) for disease per standard deviation (SD) higher abundance of microbiome.</p>
</sec> <sec>
<title>Results &amp; Conclusions</title>
<p>There was little evidence for a causal effect of gut microbiota on oral and oropharyngeal cancer when using a genome-wide p-value threshold for selecting instruments. Secondary analyses using a more lenient p-value threshold indicated that there were 90 causal relationships between 58 different microbial features but that sensitivity analyses suggested that these were possibly affected by violations of MR assumptions and were not consistent across MR methodologies or data sources and therefore are also to unlikely reflect causation. These findings provide new insights into gut microbiota-mediated oral and oropharyngeal cancers and warrant further investigation.</p>
</sec>
</abstract>
<kwd-group>
<kwd>gut microbiome</kwd>
<kwd>oral cancer</kwd>
<kwd>oropharyngeal cancer</kwd>
<kwd>Mendelian randomization</kwd>
<kwd>meta-analysis</kwd>
</kwd-group>
<counts>
<fig-count count="2"/>
<table-count count="1"/>
<equation-count count="2"/>
<ref-count count="40"/>
<page-count count="11"/>
<word-count count="6278"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-in-acceptance</meta-name>
<meta-value>Extra-intestinal Microbiome</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<title>Introduction</title>
<p>Head and neck cancer is the sixth most common cancer worldwide (<xref ref-type="bibr" rid="B35">Warnakulasuriya, 2009</xref>), with oral and oropharyngeal cancers being the most common subtypes. Tobacco and alcohol consumption (<xref ref-type="bibr" rid="B14">Hashibe et&#xa0;al., 2009</xref>), human papillomavirus (HPV) infection (<xref ref-type="bibr" rid="B2">Ang et&#xa0;al., 2010</xref>), and specific sexual behaviors (<xref ref-type="bibr" rid="B15">Heck et&#xa0;al., 2010</xref>) have been recognized as oral and oropharyngeal cancer risk factors. Recently, there has been growing recognition of links between cancer and the microbiome; in particular, cancer-associated biomarkers have been observed in the gut microbiome (<xref ref-type="bibr" rid="B10">Cullin et&#xa0;al., 2021</xref>). The gut microbiota is a collection of bacterial species present in the intestinal tract. The roles of gut microbes in tumors can be divided into local and distal roles (<xref ref-type="bibr" rid="B22">Matson et&#xa0;al., 2021</xref>). In addition to the prominent role that specific gut microbes possess in local carcinogenesis, gut microbes can also alter the host&#x2019;s overall immune system, leading to cancer (<xref ref-type="bibr" rid="B9">Castellarin et&#xa0;al., 2012</xref>; <xref ref-type="bibr" rid="B1">Amieva and Peek, 2016</xref>). There is a natural anatomical barrier between intestinal microorganisms and the intestinal epithelium, primarily composed of goblet cells that secrete intestinal mucus (<xref ref-type="bibr" rid="B18">Kim and Ho, 2010</xref>) and Paneth cells that produce antimicrobial peptides (<xref ref-type="bibr" rid="B28">Salzman et&#xa0;al., 2007</xref>). Therefore, the contact between intestinal microorganisms and the immune system is limited. However, specific microorganisms affect the integrity of the gut barrier. When this integrity is disrupted, an increased number of carcinogens circulate through the impaired gut barrier (<xref ref-type="bibr" rid="B27">Rajagopala et&#xa0;al., 2017</xref>); furthermore, inflammation or immunosuppression are induced, playing an indirect role in promoting cancer (<xref ref-type="bibr" rid="B38">Yu and Schwabe, 2017</xref>). An example illustrating this distal role is that the gut microbiota can promote hepatocellular carcinoma and pancreatic cancer growth/progression/invasion and metastasis, which contain no known microbiome, by elevating cancer-promoting inflammatory microbial-associated molecular patterns such as lipopolysaccharides (<xref ref-type="bibr" rid="B11">Dapito et&#xa0;al., 2012</xref>; <xref ref-type="bibr" rid="B24">Ochi et&#xa0;al., 2012</xref>).</p>
<p>The administration of probiotics to regulate the immune system is a potential antitumor strategy (<xref ref-type="bibr" rid="B33">V&#xe9;tizou et&#xa0;al., 2015</xref>). Gut microbes can modulate immunity by regulating the primary and secondary lymphoid organs of the intestinal epithelial barrier, thereby affecting the tumor microenvironment (<xref ref-type="bibr" rid="B13">Gopalakrishnan et&#xa0;al., 2018</xref>). An association between gut microbes and intestinal tumor susceptibility has been previously reported (<xref ref-type="bibr" rid="B36">Yachida et&#xa0;al., 2019</xref>). Gut microbiota have been shown to affect the body&#x2019;s immune response by regulating immune cell function, affecting inflammatory response, regulating immune tolerance (<xref ref-type="bibr" rid="B40">Zhou et&#xa0;al., 2021</xref>), and producing metabolites (<xref ref-type="bibr" rid="B39">Zhang et&#xa0;al., 2019</xref>). However, the causal relationship between the gut microbiota and parenteral tumors, especially oropharyngeal and oral cancers, remains unclear.</p>
<p>Mendelian randomization (MR) is a statistical method used to assess the causal relationship between exposure and outcome, based on instrumental variables (genetic variants) which can be viewed as a natural analog of randomized controlled trials (RCTs). In contrast to traditional gold-standard RCTs, participants are assigned according to their genotype, reducing the impact of reverse causality and confounding factors such as ethical and socioeconomic factors. Therefore, we aimed to investigate whether the gut microbiota is causally related to oral and oropharyngeal cancers using two-sample MR which uses summary-level data, typically from genome-wide association studies (GWASs).</p>
</sec>
<sec id="s2">
<title>Methods</title>
<sec id="s2_1">
<title>Study design and data sources</title>
<p>Our MR analysis used gut microbiota features as the exposure data and oral and oropharyngeal cancer data as the outcome (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1</bold>
</xref>). The original investigation was conducted after obtaining ethical approval for each study included in the MR analysis. Genome-wide association study (GWAS) data for the gut microbiota were obtained from the MiBioGen study (<xref ref-type="bibr" rid="B19">Kurilshikov et&#xa0;al., 2021</xref>) and the oral and oropharyngeal cancer data were obtained from the MRC IEU OpenGWAS data resource (<xref ref-type="bibr" rid="B12">Elsworth et&#xa0;al., 2020</xref>). The original oral and oropharyngeal cancers data were released from OncoArray Oral Cavity and Oropharyngeal Cancer Consortium (<xref ref-type="bibr" rid="B20">Lesseur et&#xa0;al., 2016</xref>) and UK Biobank (<xref ref-type="bibr" rid="B8">Burrows et&#xa0;al., 2021</xref>). The MiBioGen consortium includes 24 cohorts and totals 18340 participants. In each cohort, the gut microbiome is analyzed through 16S rRNA sequencing using Illumina platforms (MiSeq or HiSeq), while the participants undergo genotyping using whole-genome SNP arrays. All outcomes were based on European ancestry. Each outcome data source we used contained three outcomes: oral cancer, oropharyngeal cancer, and their combination. The OncoArray study comprised a cohort of 6,034 cases and 6,585 controls. The number of cases and controls in North America were 2549 (42.2% of total cases) and 2522 (38.3% of total controls), respectively. In Europe, 2499 cases (41.4% of total cases) and 2928 controls (44.5% of total controls) were reported. For Hispanic or Latin American, OncoArray included 986 cases (16.3%) and 1135 controls (17.2%). Because our MR Study was limited to European populations and gut microbial exposures were not available with respect to Hispanic or Latin American populations, we therefore excluded outcomes if they were Hispanic or Latin American from the study which were restricted to only those of North American and European ancestry. Given the ethnic diversity, Lesseur et&#xa0;al. evaluated associations within continent (Europe, North and South America) using multivariate unconditional logistic regressions under a log-additive genetic model adjusted for age, sex and regional eigenvectors. Genotyping of 13,107 individuals was conducted using Illumina platforms across 12 epidemiological studies. After rigorous quality control measures, a total of 6,034 cases and 6,585 cancer-free controls were included in the final analysis, 4839 cases and 5257 controls of which were of European decent and therefore were used in this MR analysis. Whole-genome imputation was performed using the Haplotype Reference Consortium panel, resulting in approximately 7 million high-quality imputed variants. The UK Biobank began in 2006 by recruiting approximately 500,000 participants between the ages of 38 and 73. Participants completed a series of questionnaires that provided detailed personal and lifestyle information. In addition, participants provided biospecimens, including blood, urine, and saliva, which were subsequently sequenced for genome sequencing and genotyping using the Illumina sequencing platform in the UK Biobank. Details of outcomes are provided in <xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>. The number of total cases of oral and oropharyngeal cancer combined and controls of the UK Biobank were 839 and 372016, respectively.</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>The whole workflow of MR analysis.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fcimb-13-1210807-g001.tif"/>
</fig>
<table-wrap id="T1" position="float">
<label>Table&#xa0;1</label>
<caption>
<p>Outcome GWAS samples used in this study.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="left">GWAS ID</th>
<th valign="top" align="left">Trait</th>
<th valign="top" align="left">Consortium</th>
<th valign="top" align="left">Sample size</th>
<th valign="top" align="left">Number of SNPs</th>
<th valign="top" align="left">Population</th>
<th valign="top" align="left">ncase</th>
<th valign="top" align="left">ncontrol</th>
<th valign="top" align="left">PMID/DOI</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">ieu-b-89</td>
<td valign="top" align="left">Oral cavity and pharyngeal cancer</td>
<td valign="top" align="left">OncoArray oral cavity and oropharyngeal cancer</td>
<td valign="top" align="left">5,425</td>
<td valign="top" align="left">7,514,278</td>
<td valign="top" align="left">European (Geographic region: Europe)</td>
<td valign="top" align="left">2,497</td>
<td valign="top" align="left">2,928</td>
<td valign="top" align="left">27749845</td>
</tr>
<tr>
<td valign="top" align="left">ieu-b-94</td>
<td valign="top" align="left">Oral cavity cancer</td>
<td valign="top" align="left">OncoArray oral cavity and oropharyngeal cancer</td>
<td valign="top" align="left">4,151</td>
<td valign="top" align="left">7,510,833</td>
<td valign="top" align="left">European (Geographic region: Europe)</td>
<td valign="top" align="left">1,223</td>
<td valign="top" align="left">2,928</td>
<td valign="top" align="left">27749845</td>
</tr>
<tr>
<td valign="top" align="left">ieu-b-96</td>
<td valign="top" align="left">Oropharyngeal cancer</td>
<td valign="top" align="left">OncoArray oral cavity and oropharyngeal cancer</td>
<td valign="top" align="left">4,018</td>
<td valign="top" align="left">7,508,444</td>
<td valign="top" align="left">European (Geographic region: Europe)</td>
<td valign="top" align="left">1,090</td>
<td valign="top" align="left">2,928</td>
<td valign="top" align="left">27749845</td>
</tr>
<tr>
<td valign="top" align="left">ieu-b-90</td>
<td valign="top" align="left">Oral cavity and pharyngeal cancer</td>
<td valign="top" align="left">OncoArray oral cavity and oropharyngeal cancer</td>
<td valign="top" align="left">4,671</td>
<td valign="top" align="left">7,510,261</td>
<td valign="top" align="left">European (Geographic region: North America)</td>
<td valign="top" align="left">2,342</td>
<td valign="top" align="left">2,329</td>
<td valign="top" align="left">27749845</td>
</tr>
<tr>
<td valign="top" align="left">ieu-b-93</td>
<td valign="top" align="left">Oral cavity cancer</td>
<td valign="top" align="left">OncoArray oral cavity and oropharyngeal cancer</td>
<td valign="top" align="left">3,464</td>
<td valign="top" align="left">7,506,142</td>
<td valign="top" align="left">European (Geographic region: North America)</td>
<td valign="top" align="left">1,135</td>
<td valign="top" align="left">2,329</td>
<td valign="top" align="left">27749845</td>
</tr>
<tr>
<td valign="top" align="left">ieu-b-97</td>
<td valign="top" align="left">Oropharyngeal cancer</td>
<td valign="top" align="left">OncoArray oral cavity and oropharyngeal cancer</td>
<td valign="top" align="left">3,448</td>
<td valign="top" align="left">7,506,485</td>
<td valign="top" align="left">European (Geographic region: North America)</td>
<td valign="top" align="left">1,119</td>
<td valign="top" align="left">2,329</td>
<td valign="top" align="left">27749845</td>
</tr>
<tr>
<td valign="top" align="left">ieu-b-4962</td>
<td valign="top" align="left">Oral and oropharyngeal cancer</td>
<td valign="top" align="left">UK Biobank</td>
<td valign="top" align="left">372,855</td>
<td valign="top" align="left">9,185,233</td>
<td valign="top" align="left">European</td>
<td valign="top" align="left">839</td>
<td valign="top" align="left">372,016</td>
<td valign="top" align="left">10.5523/bris.aed0u12w0ede20olb0m77p4b9</td>
</tr>
<tr>
<td valign="top" align="left">ieu-b-4961</td>
<td valign="top" align="left">Oral cavity cancer</td>
<td valign="top" align="left">UK Biobank</td>
<td valign="top" align="left">372,373</td>
<td valign="top" align="left">7,723,107</td>
<td valign="top" align="left">European</td>
<td valign="top" align="left">357</td>
<td valign="top" align="left">372,016</td>
<td valign="top" align="left">10.5523/bris.aed0u12w0ede20olb0m77p4b9</td>
</tr>
<tr>
<td valign="top" align="left">ieu-b-4968</td>
<td valign="top" align="left">Oropharyngeal cancer</td>
<td valign="top" align="left">UK Biobank</td>
<td valign="top" align="left">372,510</td>
<td valign="top" align="left">8,283,869</td>
<td valign="top" align="left">European</td>
<td valign="top" align="left">494</td>
<td valign="top" align="left">372,016</td>
<td valign="top" align="left">10.5523/bris.aed0u12w0ede20olb0m77p4b9</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>GWAS, Genome-wide association study; ncase, Number of case; ncontrol, Number of control; PMID, ID of study in Pubmed; DOI, Digital Object Identifier.</p>
</fn>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="s2_2">
<title>Selection of instrumental variables</title>
<p>We initially extracted instrumental variables using a genome-wide association study p-value threshold of 5e-08. Subsequently, Kurilshikov et&#xa0;al. identified a total of 30 quantitative SNP-feature associations through mbQTL analysis (<xref ref-type="bibr" rid="B19">Kurilshikov et&#xa0;al., 2021</xref>). After conducting the main Mendelian randomization (MR) analysis for these exposures, we further performed a secondary analysis using a more lenient threshold criteria, specifically, we extracted five levels of GWAS summary data of exposure (phylum, class, order, family, and genus) derived from MiBioGen, where the number of features were 9, 16, 20, 35, and 131 respectively. Single-nucleotide polymorphisms (SNPs) smaller than the p-value threshold within the locus-wide range (1 &#xd7; 10<sup>-5</sup>) were selected as instrumental variables according to a previous study (<xref ref-type="bibr" rid="B29">Sanna et&#xa0;al., 2019</xref>). One MR principle is that there is no linkage disequilibrium (LD) between the included instrumental variables, as a strong LD may lead to biased results, for strong LD may bias the results by genetic confounding or overestimating the association between the genetic variants used and the exposure and outcome. In this study, the SNPs were clumped within each phenotype, clumping processing (R<sup>2</sup>&lt; 0.1, clumping distance = 500 kb) (<xref ref-type="bibr" rid="B23">Ni et&#xa0;al., 2021</xref>) was performed to evaluated LD among the SNPs used to instrument each phenotype separately, where SNPs in LD were removed and the strongest (i.e., that with the smallest p-value) was retained for MR analyses.</p>
</sec>
<sec id="s2_3">
<title>Assumptions</title>
<p>The two-sample MR study relies on three critical assumptions to minimize bias. First, the genetic instruments used were robustly associated with exposure. Second, there is no confounding factor between the instrument and the outcome. Third, instrumental variables affected the outcomes only through exposure, meaning that there was no horizontal pleiotropy effect between instrumental variables and outcomes.</p>
</sec>
<sec id="s2_4">
<title>Statistical methods and multiple testing correction</title>
<p>When combining summarized data on genetic associations, it is necessary to ensure that genetic associations are expressed per additional copy of the same allele. If a genetic variant is a biallelic single nucleotide polymorphism (SNP) with alleles A and G on the positive strand, then the corresponding base pairs on the negative strand will be T and C. In this case, one dataset may report the association per additional copy of the A allele, and another per additional copy of the T allele &#x2013; but the same comparison is being made. Allele and strand information can be double-checked by comparing allele frequency information &#x2013; if the allele frequencies are similar for the A and T alleles, this means that this is a strand mismatch. For palindromic variants &#x2013; if the alleles were A and T (or C and G), then the same alleles would appear on both the positive and negative strands. In such a case, if the allele frequency is close to 50%, it may be necessary to drop the variant from the analysis if it is not possible to verify that the alleles have been correctly orientated. While this is a conservative recommendation, allele alignment problems have led to incorrect results in MR analyses. Therefore, palindromic SNPs with intermediate (i.e., 0.42%) frequencies were discarded. Analytical methods used included the Wald ratio and inverse variance weighted (IVW) estimators (<xref ref-type="bibr" rid="B5">Burgess et&#xa0;al., 2013</xref>). The Wald ratio estimates the causal effect of the exposure on the outcome using a single instrumental variable (IV). When horizontal pleiotropy is absent, IVW results are considered robust. In general, the Wald ratio was used for the analysis with only one SNP and the IVW method was used for the analysis with multiple SNPs The IVW has the strictest assumptions; therefore, this method was considered the main analytical method, to which results from all other methods were compared. Effect estimates and 95% confidence intervals (CIs) reflect the odds ratios (ORs) for disease per standard deviation (SD) higher abundance of microbiome.</p>
<p>In our study, we chose not to apply multiple testing correction in both primary and secondary analyses due to the complex interactions and correlations among microbial features. Although multiple testing correction is common in many studies, we believe that it might be overly stringent in this context, potentially obscuring true causal relationships. This decision is grounded in the complexity of the microbial ecosystem, where microbes often influence each other. Given these interactions, applying multiple testing correction to each microbial feature may be overly conservative and might obscure some signals that have genuine causal relationships.</p>
</sec>
<sec id="s2_5">
<title>Colocalization analysis</title>
<p>Colocalization analysis is commonly employed to ascertain whether two phenotypes are driven by the same causal variant within a particular genomic region, thereby bolstering evidence for the association between the two phenotypes. For colocalisation analyses, we extracted SNPs that fell within a 500 kb window upstream and downstream of the SNP used as an instrument for the microbial feature from both the microbiome and oral cancer GWAS datasets. To be more specific, we acquired GWAS summary data from the MRC IEU OpenGWAS data resource. Using the SNPs extracted during the primary MR analysis, we queried their chromosomal number and position within the PheWAS - IEU OpenGWAS project (mrcieu.ac.uk). With this positional information, we adjusted the numerical value by either adding or subtracting 500,000 to establish a positional range spanning 500kb upstream and downstream. With the chromosome number and positional range, we then conducted a filter operation on the GWAS summary data previously downloaded, resulting in the final selection of SNPs located within a 500kb radius both up and downstream of the instrument. The number of extracted SNPs is shown in <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table&#xa0;2</bold>
</xref>.</p>
<p>Specifically, we used the SNP positions that satisfy the threshold criteria and fall within a 500 kb window upstream and downstream as candidate SNPs for extraction in both exposure and outcome traits for colocalization analysis. Colocalization analysis involves five mutually exclusive model assumptions, namely: H0: no association exists between all SNP loci within a genomic region and both the exposure and outcome; H1/H2: significant association exists between the exposure/outcome, respectively, and SNP loci within a genomic region; H3: association exists between both exposure and outcome and SNP loci within a genomic region, driven by distinct causal variants; H4: association exists between both exposure and outcome and SNP loci within a genomic region, driven by the same causal variant. During the colocalization analysis, posterior probabilities (PP.H0-PP.H4) are generated for each of these models. The sum of the posterior probabilities for the five models equals 1.&#xa0;A higher posterior probability for a specific model indicates a higher likelihood of that model assumption being valid given the data. We considered the model assumption to be valid when the posterior probability of that model was greater than 0.80. Priors are as follows: p1: prior probability a SNP is associated with microbiome trait, default is 1e-4; p2: prior probability a SNP is associated with outcome, default is 1e-4; p12: prior probability a SNP is associated with both exposure and outcome, default is 1e-5.</p>
<p>Our colocalization analysis was based on any result obtained from the primary MR analysis that suggested a causal effect of an exposure the OncoArray outcomes. First, we identified SNPs within a 500kb range for both exposure and outcome, and then merged the data based on their rsID, aligning effect alleles. We calculated the variance (VAR) after splitting and cleaning the data by removing missing values, specifying phenotype types: binary phenotype as &#x201c;cc&#x201d; (for outcomes) and continuous phenotype as &#x201c;quant&#x201d; (for exposure). We conducted colocalization analysis using the &#x201c;coloc&#x201d; package and generated locus zoom plots using the &#x201c;locuscompare&#x201d; package.</p>
</sec>
<sec id="s2_6">
<title>Assessment of assumptions</title>
<p>We approximated the variance explained in each gut microbial trait by the respective associated genetic instruments using the following <xref ref-type="disp-formula" rid="eq1">Equation 1</xref> (<xref ref-type="bibr" rid="B30">Shim et&#xa0;al., 2015</xref>; <xref ref-type="bibr" rid="B25">Papadimitriou et&#xa0;al., 2020</xref>):</p>
<disp-formula id="eq1">
<label>(1)</label>
<mml:math display="block" id="M1">
<mml:mrow>
<mml:msup>
<mml:mi>R</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>(</mml:mi>
<mml:mrow>
<mml:mn>2</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mi>E</mml:mi>
<mml:mi>A</mml:mi>
<mml:mi>F</mml:mi>
<mml:mo>&#xd7;</mml:mo>
<mml:mi>(</mml:mi>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>E</mml:mi>
<mml:mi>A</mml:mi>
<mml:mi>F</mml:mi>
</mml:mrow>
<mml:mi>)</mml:mi>
<mml:mo>&#xd7;</mml:mo>
<mml:mi>b</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>t</mml:mi>
<mml:msup>
<mml:mi>a</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
<mml:mi>)</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mfenced>
<mml:mrow>
<mml:mn>2</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mi>E</mml:mi>
<mml:mi>A</mml:mi>
<mml:mi>F</mml:mi>
<mml:mo>&#xd7;</mml:mo>
<mml:mfenced>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>E</mml:mi>
<mml:mi>A</mml:mi>
<mml:mi>F</mml:mi>
</mml:mrow>
</mml:mfenced>
<mml:mo>&#xd7;</mml:mo>
<mml:mi>b</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>t</mml:mi>
<mml:msup>
<mml:mi>a</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
</mml:mfenced>
<mml:mo>+</mml:mo>
<mml:mfenced>
<mml:mrow>
<mml:mn>2</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mi>E</mml:mi>
<mml:mi>A</mml:mi>
<mml:mi>F</mml:mi>
<mml:mo>&#xd7;</mml:mo>
<mml:mfenced>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>E</mml:mi>
<mml:mi>A</mml:mi>
<mml:mi>F</mml:mi>
</mml:mrow>
</mml:mfenced>
<mml:mo>&#xd7;</mml:mo>
<mml:mi>N</mml:mi>
<mml:mo>&#xd7;</mml:mo>
<mml:mi>S</mml:mi>
<mml:msup>
<mml:mi>E</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<p>In this context, EAF represents the frequency of the effect allele, beta signifies the estimated genetic impact on exposure, N stands for the sample size of the GWAS concerning the association between the SNP and exposure, and SE represents the standard error of the genetic effect. Since EAF was not available for raw data on gut microbes, we inquired the allele frequency (GRCh37) of each SNP through the 1000 genome project (<ext-link ext-link-type="uri" xlink:href="https://www.internationalgenome.org/1000-genomes-browsers/index.html">https://www.internationalgenome.org/1000-genomes-browsers/index.html</ext-link>). The power of our MR analyses was assessed using the online calculator mRnd (<ext-link ext-link-type="uri" xlink:href="https://shiny.cnsgenomics.com/mRnd/">https://shiny.cnsgenomics.com/mRnd/</ext-link>).</p>
</sec>
<sec id="s2_7">
<title>Sensitivity analyses</title>
<p>Maximum likelihood (<xref ref-type="bibr" rid="B26">Pierce and Burgess, 2013</xref>), MR-Egger (<xref ref-type="bibr" rid="B3">Bowden et&#xa0;al., 2015</xref>), weighted median (<xref ref-type="bibr" rid="B4">Bowden et&#xa0;al., 2016</xref>), weighted mode, and MR-PRESSO (<xref ref-type="bibr" rid="B32">Verbanck et&#xa0;al., 2018</xref>) were used to infer potential causality. The Maximum likelihood (ML) method bears resemblance to IVW, provided there is no presence of heterogeneity and horizontal pleiotropy. If these assumptions hold true, the outcomes will remain unbiased, and the standard errors will be smaller compared to IVW (<xref ref-type="bibr" rid="B37">Yavorska and Burgess, 2017</xref>). We used the MR-Egger intercept term to assess pleiotropy. In the presence of horizontal pleiotropy, the MR-Egger effect estimate is a more accurate representation of the unbiased causal effect. If this intercept term was close to zero, then the MR-Egger regression model would be similar to the IVW model. However, if the intercept term was different from zero, it indicates that there may have been horizontal pleiotropy among these IVs. The weighted median can provide consistent estimates of causal effects, providing&lt;50% of SNPs are invalid. We assessed the robustness of the results using sensitivity analysis and tested heterogeneity using Cochran&#x2019;s Q-test in the IVW test and MR-Egger regression. We conducted MR-PRESSO tests to correct for horizontal pleiotropic effect by removing the IV outliers. MR-Egger regression was used to estimate the effect of pleiotropy; it produced a more robust pleiotropy-corrected causal estimate under the assumptions of no measurement error and instrument strength independent of direct effects (<xref ref-type="bibr" rid="B7">Burgess and Thompson, 2017</xref>). Leave-one-out analysis was used to determine whether the original causal effect was driven by a single SNP. We also used the MR Steiger test to examine evidence for directionality in the relationship (i.e., that the exposure caused the outcome rather than the reverse) by comparing the variance explained in the exposure and outcome by the exposure-related IV (<xref ref-type="bibr" rid="B16">Hemani et&#xa0;al., 2017</xref>). Furthermore, we assessed instrument strength using the F statistic (<xref ref-type="bibr" rid="B6">Burgess and Thompson, 2011</xref>), calculated using the <xref ref-type="disp-formula" rid="eq2">Equation 2</xref>:</p>
<disp-formula id="eq2">
<label>(2)</label>
<mml:math display="block" id="M2">
<mml:mrow>
<mml:mtext>F</mml:mtext>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:msup>
<mml:mi>R</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:mi>(</mml:mi>
<mml:mi>N</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>k</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
<mml:mi>)</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>k</mml:mi>
<mml:mfenced>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:msup>
<mml:mi>R</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<p>where R<sup>2</sup> represents the variance of exposure explained by the selected SNPs, N is the sample size, and k represents the number of instrumental variables. If F&lt; 10, indicating a higher likelihood of weak instrument bias, the association between instrumental variables and exposure was considered weak.</p>
</sec>
<sec id="s2_8">
<title>Meta-analyses</title>
<p>We had three outcome datasets: OncoArray (including North American and European individuals treated as separate data sources) and the UK Biobank. The meta-analysis involved meta-analysing the IVW-specific estimates of the microbial features on the same outcomes across different datasets. The meta-analysis employed both a random-effects model and a fixed-effects model, and was conducted using the meta-package in R. Heterogeneity between studies was assessed using I<sup>2</sup> and associated p-value. We first determined whether the direction of the effect size for each microbial feature was consistent across the different methods within each data source. If the direction was consistent across methods, we conducted a meta-analysis. If the effect size direction for a particular microbial feature differed among methods for any of the three data sources, then meta-analysis was not performed for that microbial feature.</p>
</sec>
<sec id="s2_9">
<title>Software and pre-registration</title>
<p>Analysis was performed using R software (version 4.0.2; R Foundation for Statistical Computing, Vienna, Austria), with the R packages &#x201c;TwoSampleMR&#x201d; (version 0.5.6) (<xref ref-type="bibr" rid="B17">Hemani et&#xa0;al., 2018</xref>) and &#x201c;MRPRESSO&#x201d; (<xref ref-type="bibr" rid="B32">Verbanck et&#xa0;al., 2018</xref>). We followed STROBE-MR (guidelines for strengthening the reporting of observational studies in epidemiological studies using MR to report our results (<xref ref-type="bibr" rid="B31">Skrivankova et&#xa0;al., 2021</xref>).</p>
</sec>
</sec>
<sec id="s3" sec-type="results">
<title>Results</title>
<sec id="s3_1">
<title>Primary MR analysis</title>
<p>We employed a genome-wide association study p-value threshold of 5e-08 to extract instrumental variables. Our results are consistent with those of Kurilshikov et&#xa0;al., as a total of 30 SNPs associated with 27 microbial phenotypes were extracted (<xref ref-type="bibr" rid="B19">Kurilshikov et&#xa0;al., 2021</xref>). Among these, genus <italic>Intestinibacter</italic>, genus <italic>RuminococcaceaeUCG009</italic>, and genus <italic>CandidatusSoleaferrea</italic> yielded one extracted SNP each (rs10805326, rs8009993, and rs830151, respectively), yet no corresponding SNP was found in the outcome. Conversely, for genus <italic>Peptococcus</italic>, genus <italic>Enteror-habdus</italic>, genus <italic>Ruminococcus1</italic>, and genus <italic>Faecalibacterium</italic>, the sole SNPs (rs75754569, rs11098863, rs10769159, and rs12320842, respectively) were discarded for being palindromic with intermediate allele frequencies.</p>
<p>We proceeded to perform MR analysis on the remaining 20 gut microbial features. Wald ratio results indicated that order <italic>Gastranaerophilales</italic>, family <italic>Gastranaerophilales</italic>, and genus <italic>Gastranaerophilales</italic> exhibited carcinogenic effects on oral and oropharyngeal cancer in the North American population from OncoArray with odds ratios (ORs) per standard deviation (SD) higher abundance of 2.610 [1.124-6.061] (oral and oropharyngeal cancer) and 3.609 [1.232-10.568] (oropharyngeal cancer). However, these effects were inconsistent across multiple data sources, as the causal effect directions of order <italic>Gastranaerophilales</italic>, family <italic>Gastranaerophilales</italic>, and genus <italic>Gastranaerophilales</italic> varied across different data sources (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table&#xa0;1</bold>
</xref>). Subsequently, we conducted colocalization analysis on these 30 SNPs, revealing that none of the PP.H4 values exceeded 0.80, providing limited evidence in support of the hypothesis that &#x201c;exposure and outcome are associated with SNP loci within a genomic region, driven by the same causal variant.&#x201d;(<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table&#xa0;2</bold>
</xref>) (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure&#xa0;1</bold>
</xref>).</p>
</sec>
<sec id="s3_2">
<title>Secondary MR analysis</title>
<p>Subsequently, we conducted analyses using a more lenient p-value threshold. We extracted five levels of GWAS summary data on exposure derived from MiBioGen. After the removal of palindromic SNPs, clumping, and harmonization of the data, the number of SNPs associated with the microbial traits that were available in the outcome data ranged from 4 to 22; the microbial trait associated with the fewest SNPs was the genus <italic>Hungatella</italic>, with four SNPs extracted, and the microbial trait associated with the most SNPs was the class <italic>Actinobacteria</italic>, with 22 SNPs extracted (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table&#xa0;3</bold>
</xref>). The R<sup>2</sup> and F-statistic values for the exposures are summarized in <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table&#xa0;4</bold>
</xref>. The R<sup>2</sup> values for all SNPs of exposure were greater than the corresponding R<sup>2</sup> for the SNPs of the outcome. The F-statistics for all exposures were greater than 10, indicating little evidence for weak instrument bias, which demonstrated that all SNPs had sufficient validity.</p>
<p>A secondary MR analysis provided evidence for causal relationships between 90 (includes 58 microbiota signatures) and oral cancers across the three data sources. There were 13, 15, and 17 microbiota features that caused a change in risk of oral cancer, oropharyngeal cancer, and combined oral and oropharyngeal cancer in the European population, respectively (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figures&#xa0;2-13</bold>
</xref>), and nine, three, and eight microbiota features that caused a change in risk of oral cancer, oropharyngeal cancer, and combined oral and oropharyngeal cancer in the North American population, respectively (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figures&#xa0;14-25</bold>
</xref>). The number of features that possessed causal relationships with oral cancer, oropharyngeal cancer, and combined oral and oropharyngeal cancer in the UK Biobank data were 10, 5, and 10, respectively (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figures&#xa0;26-37</bold>
</xref>) (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table&#xa0;3</bold>
</xref>).</p>
<p>We present the results of microbiota signatures with causal effects on oral or oropharyngeal cancer in combined oral and oropharyngeal cancer data, for these estimates were consistent in terms of direction of effect in all methods. For the European region, genus <italic>Hungatella</italic> (OR=2.735, [1.565;4.78] (Oropharyngeal cancer)), and <italic>Parabacteroides</italic> were risk factors, whereas the genus <italic>Alistipes</italic> and <italic>Eubacterium coprostanoligenes</italic> group, phylum <italic>Lentisphaerae</italic> (OR=0.448, [0.292;0.686] (Oropharyngeal cancer)), class <italic>Lentisphaeria</italic>, and order <italic>Victivallales</italic> were protective factors (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2A</bold>
</xref>).</p>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>Features that causally associated with oral and oropharyngeal cancer of OncoArray and UK Biobank.<bold>(A)</bold> Forest plot of features that causally associated with Oral and oropharyngeal cancer of OncoArray; <bold>(B)</bold> Forest plot of features that causally associated with Oral and oropharyngeal cancer of UK Biobank.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fcimb-13-1210807-g002.tif"/>
</fig>
<p>In North American populations, one protective factor (genus <italic>Butyrivibrio</italic>) (OR=0.784, [0.619;0.991] (Oral cavity and oropharyngeal cancer)), and one risk factor (genus <italic>Eubacterium xylanophilum group</italic>) (OR=2.223, [1.129;4.376] (Oral cavity cancer)) were causally associated with combined oral and oropharyngeal cancers and oral or oropharyngeal cancer (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2A</bold>
</xref>).</p>
<p>In the UK Biobank data, there were seven microbial characteristics were associated with outcomes, among which class <italic>Betaproteobacteria</italic>, order <italic>Burkholderiales</italic>(OR=1.001, [1.000;1.002] (Oral cavity cancer)) were risk factors, whilst class <italic>Actinobacteria</italic>, family <italic>Bifidobacteriaceae</italic>, genus <italic>Bifidobacterium</italic>(OR=0.998, [0.998;0.999](Oral and oropharyngeal cancer)) and <italic>Butyrivibrio</italic>, and order <italic>Bifidobacteriales</italic> were protective factors. (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2B</bold>
</xref>).</p>
<p>Unfortunately, none of the signatures were consistent across the three data sources. However, there were 7 signatures that were consistent across the two data sources, including class <italic>Lentisphaeria</italic> (European region and North American region of OncoArray), genus <italic>Butyrivibrio</italic> (North American region of OncoArray and UK Biobank), order <italic>Bacillales</italic> (European region of OncoArray and UK Biobank), order <italic>Bifidobacteriales</italic> (European region of OncoArray and UK Biobank), order <italic>Burkholderiales</italic> (North American region of OncoArray and UK Biobank), order <italic>Victivallales</italic> (European region and North American region of OncoArray), family <italic>Bifidobacteriaceae</italic> (European region of OncoArray and UK Biobank). We compared the direction of the resulting effect size for the 20 exposures in the main analysis with the direction of the effect size obtained after the use of the lenient threshold criteria. Among the 180 causal relationships examined, 113 exhibited consistent effect directions in the secondary MR analysis following lenient threshold criteria. Of the 20 phenotypes assessed in the main analysis, none had directionally consistent effect estimates across main and secondary analyses across all methods in 9 outcomes. Notably, genus <italic>Tyzzerella3</italic> and genus <italic>Romboutsia</italic> maintained consistent directions for 8 effect estimates after the secondary analysis. The direction of effect for Gastranaerophilales on oral cavity and pharyngeal cancer and oropharyngeal cancer (Both from North American region of OncoArray) was the same as the direction of effect for Gastranaerophilales in the secondary analysis across all methods (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table&#xa0;1</bold>
</xref>).</p>
</sec>
<sec id="s3_3">
<title>Sensitivity analyses</title>
<p>The results of Cochran&#x2019;s Q test suggested that there was little evidence of heterogeneity, where all p-values were greater than 0.05. The horizontal pleiotropy between instrumental variables and outcomes was assessed using the MR-Egger regression. There was little evidence of horizontal pleiotropy was found (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table&#xa0;4</bold>
</xref>). MR-PRESSO global test results showed the presence of outliers only in the genus <italic>Veillonella</italic> analysis of Oral and oropharyngeal cancer (UK Biobank). After excluding outliers, the MR-PRESSO results showed that there was no evidence for a causal effect of <italic>Veillonella</italic> on either cancer. Additionally, the leave-one-out analysis showed that none of the identified causal associations were driven by any single IV. (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figures&#xa0;2&#x2013;37</bold>
</xref>).</p>
<p>In our secondary MR Analysis, 18 causal relationships (17 microbial traits) were found to be inconsistent in the direction of causal effects among different methodologies (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table&#xa0;3</bold>
</xref>), so these causal relationships were excluded from the subsequent meta-analysis. There were 72 causal relationships (50 microbial traits) in the same direction of causal effects across methodologies (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table&#xa0;3</bold>
</xref>).</p>
<p>We performed the MR Steiger directionality test to determine whether there was evidence that the assumed direction of causality was correct. All Steiger test p-values were less than 0.05, suggesting that the assumed direction of effect from the gut microbiome to oral and oropharyngeal cancers was correct, except for the genus <italic>Hungatella</italic> on oropharyngeal cancer (Steiger <italic>P</italic>-value=0.32). However, the R<sup>2</sup> of exposure SNPs was greater than that of the outcome, suggesting that all causal directions were correct.</p>
</sec>
<sec id="s3_4">
<title>Meta-analysis</title>
<p>For class <italic>Lentisphaeria</italic>, genus <italic>Butyrivibrio</italic>, genus <italic>Ruminococcus 2</italic>, order <italic>Victivallales</italic>, and phylum <italic>Lentisphaerae</italic> consistently aligned with the MR methods, and therefore, estimates of the effect of these microbial features on oral and oropharyngeal cancer from all three data sources were included in the meta-analysis. Our results showed that there was limited evidence suggesting a causal effect of any microbial feature on oral and oropharyngeal cancer in the meta-analysis (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table&#xa0;5</bold>
</xref>). Next, we conducted a meta-analysis for oral cancer outcomes, using the same criteria as before. Although genus <italic>Eubacterium xylanophilum group</italic>, genus <italic>Parabacteroides</italic>, and genus <italic>Ruminococcus gauvreauii group</italic> consistently aligned with the MR methods, the meta-analysis results provided little evidence for causal effects (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table&#xa0;6</bold>
</xref>).</p>
<p>Only the estimates of genus Ruminococcaceae UCG010 were consistent in direction across all methods in individual data sources, therefore, the meta-analysis was conducted with this one microbial feature. Results showed little evidence for a causal effect of Ruminococcaceae UCG010 on oropharyngeal cancer (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table&#xa0;7</bold>
</xref>).</p>
</sec>
</sec>
<sec id="s4" sec-type="discussion">
<title>Discussion</title>
<p>In the current study, we performed MR analyses to assess causal effect of gut microbial signatures on oral and oropharyngeal cancer. Firstly, the main analysis is where instruments have been selected based on a genome-wide p-value threshold. Although the initial analysis found a causal association between genus <italic>Gastranaerophilales</italic> and oropharyngeal cancer, despite initial analyses suggesting a causal effect, colocalisation analyses implied that these results are unlikely reflective of causality. Although we lowered the criteria for the extraction of instrumental variables and obtained 58 microbiota features with possible causal associations in secondary MR analysis, after meta-analysis of the 9 microbial features across each data source was consistent among different methods, random effects model showed limited evidence of causal effects. In addition, the main results of the meta-analysis were derived from secondary MR with lenient threshold criteria, which is likely biased given the lack of robust associations between instruments and the exposure. Therefore, based on the results of our primary MR analysis and colocalization analysis, which is a requirement for causality, we believe that the current evidence does not yet support the causal association of gut microbiota characteristics with oral and oropharyngeal cancer.</p>
<p>Whilst we were unable to provide strong evidence of horizontal pleiotropy in these analyses, it is possible (and likely) that the instruments we used may still be pleiotropic. While our outcome data originated from a sample of European individuals, it&#x2019;s crucial to note that the MiBioGen data exhibit mixed ancestry, introducing the possibility of violating the second MR assumption due to genetic confounding. To establish causality, addressing confounding becomes imperative, wherein a third variable influences both exposure and outcome, creating a noncausal association. Genetic confounding is a nuanced scenario wherein genetic factors serve as this influential third variable. The inherent complexity of gene inheritance in organisms poses a challenge, making it arduous to fully isolate or control for the specific effects of individual genes, rendering the adjustment for genetic confounding difficult.</p>
<p>We observed that original data for microbial features under the same taxonomic classification (class <italic>Lentisphaeria</italic>-order <italic>Victivallales</italic>) and (order <italic>Bifidobacteriales</italic>-family <italic>Bifidobacteriaceae</italic>) were entirely identical, yielding the same OR values. This convergence could be attributed, on one hand, to potential characteristic dominant species within the same taxonomic classification, resulting in data congruence between the upper and lower taxonomic levels. On the other hand, order <italic>Bifidobacteriales</italic> predominantly segregates into family <italic>Bifidobacteriaceae</italic> and family <italic>Gardnerellaceae</italic>, with the latter recognized for its presence in maintaining vaginal microbial equilibrium in female reproductive tracts. Given that our exposure data were sourced from gut microbiota, data congruence between order <italic>Bifidobacteriales</italic> and family <italic>Bifidobacteriaceae</italic> was plausible. We opted for data representation at relatively lower taxonomic levels and refrained from analyzing analogous microbial features as independent exposures. For instance, we selected order <italic>Victivallales</italic> from (class <italic>Lentisphaeria</italic> and order <italic>Victivallales</italic>) and family <italic>Bifidobacteriaceae</italic> from (order <italic>Bifidobacteriales</italic> and family <italic>Bifidobacteriaceae</italic>) to curtail redundancy.</p>
<p>Understanding the causal relationship between gut microbiota and oral and oropharyngeal cancers can help guide decisions on health management and disease prevention strategies. Because GWAS data for the oral microbiome are unavailable, and oral microbiota has a more diverse and dynamic bacterial community than gut microbiota (<xref ref-type="bibr" rid="B21">Maki et&#xa0;al., 2021</xref>). Therefore, we selected the largest currently published GWAS for the gut microbiome from the MiBioGen consortium. Our study validated the features of the gut microbiota associated with cancer susceptibility. We performed analyses both with the genome-wide p-value threshold and with a more lenient p-value threshold, as a secondary analysis. Whilst extracted instrumental variables that did not meet the traditional genome-wide p-value threshold may very likely lead to weak instrument bias and violate core MR assumptions, the use of a lenient p-value threshold allowed the application of pleiotropy-robust methods in sensitivity analyses. And for those results with different causal directions from different MR methods, only those results with the same causal direction from all methods were reported. We assessed weak instrument bias through F-statistics and found little evidence for weak instruments. However, even if the F-statistic is greater than 10, instrumental variables may still be ineffective, as they could exhibit a high degree of pleiotropy (wherein ineffective instruments can still yield a high F-statistic) (<xref ref-type="bibr" rid="B34">Wade and Hall, 2019</xref>). Instrumental variables might be associated with outcomes through various channels, leading to violations of MR assumptions if independent from the exposure. We cannot rule out this possibility in our analysis. In addition to the pleiotropy-robust methods, the MR Steiger directionality test was used to test for the causal direction of effect and, in almost all causes, it provided evidence that the assumed causal direction (i.e., from the exposure to outcome) was correct. The genus <italic>Hungatella</italic> failed to pass, that is, it did not provide enough evidence to support the direction of causality. Therefore, genus <italic>Hungatella</italic> cannot be considered to have a causal effect on oropharyngeal cancer.</p>
<p>Moreover, augmenting the study&#x2019;s sample size holds the potential to enhance statistical power, thereby elevating the probability of identifying associations. Larger sample sizes contribute to more accurate estimates and diminish p-values. The observed disparity in the significance of the association between a gut microbiome feature, as indicated by Oncoarray versus UK Biobank, may stem from variations in sample size. Despite the notably extensive size of the UK Biobank dataset, the proportion of cases within the total sample remains relatively modest. This discrepancy could have compromised statistical power, conceivably masking authentic effect signals that might otherwise be discernible. In addition, the MR-Egger method is sensitive to horizontal pleiotropy, that is, genetic variation affects the outcome independent of the exposure. Although the p value of the MR-Egger intercept in our study was greater than 0.05, there was indeed an unbalanced pleiotropic effect in our secondary analysis.</p>
<p>In our secondary MR results, the genus <italic>Intestinibacter</italic>, <italic>Ruminiclostridium5</italic>, and the order <italic>Rhodospirillales</italic> exhibited causal effect estimates using the MR-Egger method that differed in direction from those obtained through other methods (IVW, Maximum Likelihood, Weighted Median, etc.), suggesting violations of MR assumptions. The difference in power limitations between the MR-Egger estimator and other MR methods stems from the fact that the former estimates two parameters &#x2013; the causal effect and the degree of unbalanced pleiotropy &#x2013; whereas other methods focus solely on estimating the singular parameter, the causal effect. While our sensitivity analysis did not reveal the presence of pleiotropy, the results for these specific microbial features suggest a potential underlying pleiotropy. Additionally, several other microbial features displayed varying causal effects across different data sources, such as the family <italic>Prevotellaceae</italic> and the orders <italic>Bacillales</italic> and <italic>Burkholderiales</italic>. The family <italic>Prevotellaceae</italic> demonstrated a risk factor for oral and oropharyngeal cancer in European populations while being protective in North American populations. We hypothesize that these variations in the impact of these microbial features on oral and oropharyngeal cancer between North American and European populations could stem from differences in dietary habits and lifestyles, or potentially environmental influences on microbial composition and functionality. Furthermore, the sample size and diversity of the microbial communities under study could affect the stability of results. The divergence in outcomes between different regions could possibly be attributed to factors such as higher microbial diversity. However, our study&#x2019;s primary objective was to explore microbial features associated causally with the occurrence of oral and oropharyngeal cancer in European populations. At present, there are no reports on variations in the effects of regional microbial features on oral and oropharyngeal cancer. Therefore, our interpretation of potential reasons for the differing impacts can only be approached with caution.</p>
<p>In our study, we&#x2019;ve chosen not to apply multiple testing correction in the primary and secondary analyses due to the complex interactions and correlations among microbial features. While multiple testing correction is common, we believe it might be overly strict in this context, potentially hiding true causal relationships. We acknowledge this as a limitation and recommend future research to explore these interactions, develop precise statistical methods, and conduct larger studies for validation.</p>
<p>Our study initially provided evidence that features of the gut microbiome may influence oral and oropharyngeal cancers. However, due to likely violations of core MR assumptions and heterogeneity across both different methodologies that test those assumptions and across data sources of the same outcomes, our results indicate that gut microbiota may not play an important role in the development of oral and oropharyngeal cancers. In conclusion, we comprehensively evaluated the potential causal relationship between the gut microbiota and oral and oropharyngeal cancers. This study provides new insights into the mechanisms of microbial-mediated oral and oropharyngeal cancer development.</p>
</sec>
<sec id="s5" sec-type="data-availability">
<title>Data availability statement</title>
<p>Publicly available datasets were analyzed in this study. This data can be found here: <ext-link ext-link-type="uri" xlink:href="https://gwas.mrcieu.ac.uk/">https://gwas.mrcieu.ac.uk/</ext-link>.</p>
</sec>
<sec id="s6" sec-type="author-contributions">
<title>Author contributions</title>
<p>Conceptualization, YX and XJ. Methodology, QZ. Software, QZ. Validation, YX and JX. Formal analysis, HW. Investigation, YT. Resources, XJ. Data curation, JL. Writing-original draft preparation, QZ and HW. Visualization, XJ. Supervision, XJ. Project administration, XJ. Funding acquisition, XJ and YX. All authors contributed to the article and approved the submitted version.</p>
</sec>
</body>
<back>
<sec id="s7" sec-type="funding-information">
<title>Funding</title>
<p>The author(s) declare financial support was received for the research, authorship, and/or publication of this article. This research was funded by the Jilin Provincial Science and Technology Foundation (grant numbers 20210509003RQ and 20210402002GH), the Achievement Transformation Guiding Foundations of The First Hospital of Jilin University (grant number CGZHYD202012-029).</p>
</sec>
<ack>
<title>Acknowledgments</title>
<p>We would like to thank Editage (<ext-link ext-link-type="uri" xlink:href="http://www.editage.cn">www.editage.cn</ext-link>) for English language editing.</p>
</ack>
<sec id="s8" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s9" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s10" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fcimb.2023.1210807/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fcimb.2023.1210807/full#supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="Table_1.xlsx" id="ST1" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/>
<supplementary-material xlink:href="Table_2.xlsx" id="ST2" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/>
<supplementary-material xlink:href="Table_3.xlsx" id="ST3" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/>
<supplementary-material xlink:href="Table_4.xlsx" id="ST4" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/>
<supplementary-material xlink:href="Table_5.xlsx" id="ST5" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/>
<supplementary-material xlink:href="Table_6.xlsx" id="ST6" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/>
<supplementary-material xlink:href="Table_7.xlsx" id="ST7" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/>
<supplementary-material xlink:href="Presentation_1.pptx" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.presentationml.presentation"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Amieva</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Peek</surname> <given-names>R. M.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Pathobiology of helicobacter pylori-induced gastric cancer</article-title>. <source>Gastroenterology</source> <volume>150</volume> (<issue>1</issue>), <fpage>64</fpage>&#x2013;<lpage>78</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1053/j.gastro.2015.09.004</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ang</surname> <given-names>K. K.</given-names>
</name>
<name>
<surname>Harris</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Wheeler</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Weber</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Rosenthal</surname> <given-names>D. I.</given-names>
</name>
<name>
<surname>Nguyen-T&#xe2;n</surname> <given-names>P. F.</given-names>
</name>
<etal/>
</person-group>. (<year>2010</year>). <article-title>Human papillomavirus and survival of patients with oropharyngeal cancer</article-title>. <source>N Engl. J. Med.</source> <volume>363</volume> (<issue>1</issue>), <fpage>24</fpage>&#x2013;<lpage>35</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1056/NEJMoa0912217</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bowden</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Davey Smith</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Burgess</surname> <given-names>S.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Mendelian randomization with invalid instruments: effect estimation and bias detection through Egger regression</article-title>. <source>Int. J. Epidemiol.</source> <volume>44</volume> (<issue>2</issue>), <fpage>512</fpage>&#x2013;<lpage>525</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/ije/dyv080</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bowden</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Davey Smith</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Haycock</surname> <given-names>P. C.</given-names>
</name>
<name>
<surname>Burgess</surname> <given-names>S.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Consistent estimation in mendelian randomization with some invalid instruments using a weighted median estimator</article-title>. <source>Genet. Epidemiol.</source> <volume>40</volume> (<issue>4</issue>), <fpage>304</fpage>&#x2013;<lpage>314</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/gepi.21965</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Burgess</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Butterworth</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Thompson</surname> <given-names>S. G.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Mendelian randomization analysis with multiple genetic variants using summarized data</article-title>. <source>Genet. Epidemiol.</source> <volume>37</volume> (<issue>7</issue>), <fpage>658</fpage>&#x2013;<lpage>665</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/gepi.21758</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Burgess</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Thompson</surname> <given-names>S. G.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Avoiding bias from weak instruments in Mendelian randomization studies</article-title>. <source>Int. J. Epidemiol.</source> <volume>40</volume> (<issue>3</issue>), <fpage>755</fpage>&#x2013;<lpage>764</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/ije/dyr036</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Burgess</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Thompson</surname> <given-names>S. G.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Interpreting findings from Mendelian randomization using the MR-Egger method</article-title>. <source>Eur. J. Epidemiol.</source> <volume>32</volume> (<issue>5</issue>), <fpage>377</fpage>&#x2013;<lpage>389</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s10654-017-0255-x</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Burrows</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Bull</surname> <given-names>C. J.</given-names>
</name>
<name>
<surname>Dudding</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Gormley</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Robinson</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Tan</surname> <given-names>V.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <source>Genome-wide association study of cancer risk in UK biobank</source>. <publisher-loc>Beacon House, Bristol, United Kingdom</publisher-loc>: <publisher-name>University of Bristol</publisher-name>.</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Castellarin</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Warren</surname> <given-names>R. L.</given-names>
</name>
<name>
<surname>Freeman</surname> <given-names>J. D.</given-names>
</name>
<name>
<surname>Dreolini</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Krzywinski</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Strauss</surname> <given-names>J.</given-names>
</name>
<etal/>
</person-group>. (<year>2012</year>). <article-title>Fusobacterium nucleatum infection is prevalent in human colorectal carcinoma</article-title>. <source>Genome Res.</source> <volume>22</volume> (<issue>2</issue>), <fpage>299</fpage>&#x2013;<lpage>306</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1101/gr.126516.111</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cullin</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Azevedo Antunes</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Straussman</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Stein-Thoeringer</surname> <given-names>C. K.</given-names>
</name>
<name>
<surname>Elinav</surname> <given-names>E.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Microbiome and cancer</article-title>. <source>Cancer Cell</source> <volume>39</volume> (<issue>10</issue>), <fpage>1317</fpage>&#x2013;<lpage>1341</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.ccell.2021.08.006</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dapito</surname> <given-names>D. H.</given-names>
</name>
<name>
<surname>Mencin</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Gwak</surname> <given-names>G.-Y.</given-names>
</name>
<name>
<surname>Pradere</surname> <given-names>J. P.</given-names>
</name>
<name>
<surname>Jang</surname> <given-names>M. K.</given-names>
</name>
<name>
<surname>Mederacke</surname> <given-names>I.</given-names>
</name>
<etal/>
</person-group>. (<year>2012</year>). <article-title>Promotion of hepatocellular carcinoma by the intestinal microbiota and TLR4</article-title>. <source>Cancer Cell</source> <volume>21</volume> (<issue>4</issue>), <fpage>504</fpage>&#x2013;<lpage>516</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.ccr.2012.02.007</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Elsworth</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Lyon</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Alexander</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Matthews</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Hallett</surname> <given-names>J.</given-names>
</name>
<etal/>
</person-group>. (<year>2020</year>). <article-title>The MRC IEU OpenGWAS data infrastructure</article-title>. <source>bioRxiv</source>. doi:&#xa0;<pub-id pub-id-type="doi">10.1101/2020.08.10.244293</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gopalakrishnan</surname> <given-names>V.</given-names>
</name>
<name>
<surname>Helmink</surname> <given-names>B. A.</given-names>
</name>
<name>
<surname>Spencer</surname> <given-names>C. N.</given-names>
</name>
<name>
<surname>Reuben</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Wargo</surname> <given-names>J. A.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>The influence of the gut microbiome on cancer, immunity, and cancer immunotherapy</article-title>. <source>Cancer Cell</source> <volume>33</volume> (<issue>4</issue>), <fpage>570</fpage>&#x2013;<lpage>580</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.ccell.2018.03.015</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hashibe</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Brennan</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Chuang</surname> <given-names>S.-C.</given-names>
</name>
<name>
<surname>Boccia</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Castellsague</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>C.</given-names>
</name>
<etal/>
</person-group>. (<year>2009</year>). <article-title>Interaction between tobacco and alcohol use and the risk of head and neck cancer: pooled analysis in the International Head and Neck Cancer Epidemiology Consortium</article-title>. <source>Cancer Epidemiol. Biomarkers Prev.</source> <volume>18</volume> (<issue>2</issue>), <fpage>541</fpage>&#x2013;<lpage>550</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1158/1055-9965.EPI-08-0347</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Heck</surname> <given-names>J. E.</given-names>
</name>
<name>
<surname>Berthiller</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Vaccarella</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Winn</surname> <given-names>D. M.</given-names>
</name>
<name>
<surname>Smith</surname> <given-names>E. M.</given-names>
</name>
<name>
<surname>Shan'gina</surname> <given-names>O.</given-names>
</name>
<etal/>
</person-group>. (<year>2010</year>). <article-title>Sexual behaviours and the risk of head and neck cancers: a pooled analysis in the International Head and Neck Cancer Epidemiology (INHANCE) consortium</article-title>. <source>Int. J. Epidemiol.</source> <volume>39</volume> (<issue>1</issue>), <fpage>166</fpage>&#x2013;<lpage>181</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/ije/dyp350</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hemani</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Tilling</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Davey Smith</surname> <given-names>G.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Orienting the causal relationship between imprecisely measured traits using GWAS summary data</article-title>. <source>PloS Genet.</source> <volume>13</volume> (<issue>11</issue>), <elocation-id>e1007081</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1371/journal.pgen.1007081</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hemani</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Zheng</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Elsworth</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Wade</surname> <given-names>K. H.</given-names>
</name>
<name>
<surname>Haberland</surname> <given-names>V.</given-names>
</name>
<name>
<surname>Baird</surname> <given-names>D.</given-names>
</name>
<etal/>
</person-group>. (<year>2018</year>). <article-title>The MR-Base platform supports systematic causal inference across the human phenome</article-title>. <source>Elife</source> <volume>7</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.7554/eLife.34408</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kim</surname> <given-names>Y. S.</given-names>
</name>
<name>
<surname>Ho</surname> <given-names>S. B.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Intestinal goblet cells and mucins in health and disease: recent insights and progress</article-title>. <source>Curr. Gastroenterol. Rep.</source> <volume>12</volume> (<issue>5</issue>), <fpage>319</fpage>&#x2013;<lpage>330</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s11894-010-0131-2</pub-id>
</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kurilshikov</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Medina-Gomez</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Bacigalupe</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Radjabzadeh</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Demirkan</surname> <given-names>A.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Large-scale association analyses identify host factors influencing human gut microbiome composition</article-title>. <source>Nat. Genet.</source> <volume>53</volume> (<issue>2</issue>), <fpage>156</fpage>&#x2013;<lpage>165</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41588-020-00763-1</pub-id>
</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lesseur</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Diergaarde</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Olshan</surname> <given-names>A. F.</given-names>
</name>
<name>
<surname>W&#xfc;nsch-Filho</surname> <given-names>V.</given-names>
</name>
<name>
<surname>Ness</surname> <given-names>A. R.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>G.</given-names>
</name>
<etal/>
</person-group>. (<year>2016</year>). <article-title>Genome-wide association analyses identify new susceptibility loci for oral cavity and pharyngeal cancer</article-title>. <source>Nat. Genet.</source> <volume>48</volume> (<issue>12</issue>), <fpage>1544</fpage>&#x2013;<lpage>1550</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/ng.3685</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Maki</surname> <given-names>K. A.</given-names>
</name>
<name>
<surname>Kazmi</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Barb</surname> <given-names>J. J.</given-names>
</name>
<name>
<surname>Ames</surname> <given-names>N.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>The oral and gut bacterial microbiomes: similarities, differences, and connections</article-title>. <source>Biol. Res. Nurs.</source> <volume>23</volume> (<issue>1</issue>). doi:&#xa0;<pub-id pub-id-type="doi">10.1177/1099800420941606</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Matson</surname> <given-names>V.</given-names>
</name>
<name>
<surname>Chervin</surname> <given-names>C. S.</given-names>
</name>
<name>
<surname>Gajewski</surname> <given-names>T. F.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Cancer and the microbiome-influence of the commensal microbiota on cancer, immune responses, and immunotherapy</article-title>. <source>Gastroenterology</source> <volume>160</volume> (<issue>2</issue>), <fpage>600</fpage>&#x2013;<lpage>613</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1053/j.gastro.2020.11.041</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ni</surname> <given-names>J.-J.</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Yan</surname> <given-names>S.-S.</given-names>
</name>
<name>
<surname>Han</surname> <given-names>B. X.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Wei</surname> <given-names>X. T.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Gut microbiota and psychiatric disorders: A two-sample mendelian randomization study</article-title>. <source>Front. Microbiol.</source> <volume>12</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fmicb.2021.737197</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ochi</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Nguyen</surname> <given-names>A. H.</given-names>
</name>
<name>
<surname>Bedrosian</surname> <given-names>A. S.</given-names>
</name>
<name>
<surname>Mushlin</surname> <given-names>H. M.</given-names>
</name>
<name>
<surname>Zarbakhsh</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Barilla</surname> <given-names>R. S.</given-names>
</name>
<etal/>
</person-group>. (<year>2012</year>). <article-title>MyD88 inhibition amplifies dendritic cell capacity to promote pancreatic carcinogenesis <italic>via</italic> Th2 cells</article-title>. <source>J. Exp. Med.</source> <volume>209</volume> (<issue>9</issue>), <fpage>1671</fpage>&#x2013;<lpage>1687</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1084/jem.20111706</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Papadimitriou</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Dimou</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Tsilidis</surname> <given-names>K. K.</given-names>
</name>
<name>
<surname>Banbury</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Martin</surname> <given-names>R. M.</given-names>
</name>
<name>
<surname>Lewis</surname> <given-names>S. J.</given-names>
</name>
<etal/>
</person-group>. (<year>2020</year>). <article-title>Physical activity and risks of breast and colorectal cancer: a Mendelian randomisation analysis</article-title>. <source>Nat. Commun.</source> <volume>11</volume> (<issue>1</issue>), <fpage>597</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41467-020-14389-8</pub-id>
</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pierce</surname> <given-names>B. L.</given-names>
</name>
<name>
<surname>Burgess</surname> <given-names>S.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Efficient design for Mendelian randomization studies: subsample and 2-sample instrumental variable estimators</article-title>. <source>Am. J. Epidemiol.</source> <volume>178</volume> (<issue>7</issue>), <fpage>1177</fpage>&#x2013;<lpage>1184</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/aje/kwt084</pub-id>
</citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rajagopala</surname> <given-names>S. V.</given-names>
</name>
<name>
<surname>Vashee</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Oldfield</surname> <given-names>L. M.</given-names>
</name>
<name>
<surname>Suzuki</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Venter</surname> <given-names>J. C.</given-names>
</name>
<name>
<surname>Telenti</surname> <given-names>A.</given-names>
</name>
<etal/>
</person-group>. (<year>2017</year>). <article-title>The human microbiome and cancer</article-title>. <source>Cancer Prev. Res. (Phila)</source> <volume>10</volume> (<issue>4</issue>), <fpage>226</fpage>&#x2013;<lpage>234</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1158/1940-6207.CAPR-16-0249</pub-id>
</citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Salzman</surname> <given-names>N. H.</given-names>
</name>
<name>
<surname>Underwood</surname> <given-names>M. A.</given-names>
</name>
<name>
<surname>Bevins</surname> <given-names>C. L.</given-names>
</name>
</person-group> (<year>2007</year>). <article-title>Paneth cells, defensins, and the commensal microbiota: a hypothesis on intimate interplay at the intestinal mucosa</article-title>. <source>Semin. Immunol.</source> <volume>19</volume> (<issue>2</issue>), <fpage>70</fpage>&#x2013;<lpage>83</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.smim.2007.04.002</pub-id>
</citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sanna</surname> <given-names>S.</given-names>
</name>
<name>
<surname>van Zuydam</surname> <given-names>N. R.</given-names>
</name>
<name>
<surname>Mahajan</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Kurilshikov</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Vich Vila</surname> <given-names>A.</given-names>
</name>
<name>
<surname>V&#xf5;sa</surname> <given-names>U.</given-names>
</name>
<etal/>
</person-group>. (<year>2019</year>). <article-title>Causal relationships among the gut microbiome, short-chain fatty acids and metabolic diseases</article-title>. <source>Nat. Genet.</source> <volume>51</volume> (<issue>4</issue>), <fpage>600</fpage>&#x2013;<lpage>605</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41588-019-0350-x</pub-id>
</citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shim</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Chasman</surname> <given-names>D. I.</given-names>
</name>
<name>
<surname>Smith</surname> <given-names>J. D.</given-names>
</name>
<name>
<surname>Mora</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Ridker</surname> <given-names>P. M.</given-names>
</name>
<name>
<surname>Nickerson</surname> <given-names>D. A.</given-names>
</name>
<etal/>
</person-group>. (<year>2015</year>). <article-title>A multivariate genome-wide association analysis of 10 LDL subfractions, and their response to statin treatment, in 1868 Caucasians</article-title>. <source>PloS One</source> <volume>10</volume> (<issue>4</issue>), <elocation-id>e0120758</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1371/journal.pone.0120758</pub-id>
</citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Skrivankova</surname> <given-names>V. W.</given-names>
</name>
<name>
<surname>Richmond</surname> <given-names>R. C.</given-names>
</name>
<name>
<surname>Woolf</surname> <given-names>B. A. R.</given-names>
</name>
<name>
<surname>Davies</surname> <given-names>N. M.</given-names>
</name>
<name>
<surname>Swanson</surname> <given-names>S. A.</given-names>
</name>
<name>
<surname>VanderWeele</surname> <given-names>T. J.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Strengthening the reporting of observational studies in epidemiology using mendelian randomisation (STROBE-MR): explanation and elaboration</article-title>. <source>BMJ</source> <volume>375</volume>, <elocation-id>n2233</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1136/bmj.n2233</pub-id>
</citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Verbanck</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>C.-Y.</given-names>
</name>
<name>
<surname>Neale</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Do</surname> <given-names>R.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Detection of widespread horizontal pleiotropy in causal relationships inferred from Mendelian randomization between complex traits and diseases</article-title>. <source>Nat. Genet.</source> <volume>50</volume> (<issue>5</issue>), <fpage>693</fpage>&#x2013;<lpage>698</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41588-018-0099-7</pub-id>
</citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>V&#xe9;tizou</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Pitt</surname> <given-names>J. M.</given-names>
</name>
<name>
<surname>Daill&#xe8;re</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Lepage</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Waldschmitt</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Flament</surname> <given-names>C.</given-names>
</name>
<etal/>
</person-group>. (<year>2015</year>). <article-title>Anticancer immunotherapy by CTLA-4 blockade relies on the gut microbiota</article-title>. <source>Science</source> <volume>350</volume> (<issue>6264</issue>), <fpage>1079</fpage>&#x2013;<lpage>1084</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1126/science.aad1329</pub-id>
</citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wade</surname> <given-names>K. H.</given-names>
</name>
<name>
<surname>Hall</surname> <given-names>L. J.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Improving causality in microbiome research: can human genetic epidemiology help</article-title>? <source>Wellcome Open Res.</source> <volume>4</volume>, <fpage>199</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.12688/wellcomeopenres.15628.3</pub-id>
</citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Warnakulasuriya</surname> <given-names>S.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Global epidemiology of oral and oropharyngeal cancer</article-title>. <source>Oral. Oncol.</source> <volume>45</volume> (<issue>4-5</issue>), <fpage>309</fpage>&#x2013;<lpage>316</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.oraloncology.2008.06.002</pub-id>
</citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yachida</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Mizutani</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Shiroma</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Shiba</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Nakajima</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Sakamoto</surname> <given-names>T.</given-names>
</name>
<etal/>
</person-group>. (<year>2019</year>). <article-title>Metagenomic and metabolomic analyses reveal distinct stage-specific phenotypes of the gut microbiota in colorectal cancer</article-title>. <source>Nat. Med.</source> <volume>25</volume> (<issue>6</issue>), <fpage>968</fpage>&#x2013;<lpage>976</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41591-019-0458-7</pub-id>
</citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yavorska</surname> <given-names>O. O.</given-names>
</name>
<name>
<surname>Burgess</surname> <given-names>S.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>MendelianRandomization: an R package for performing Mendelian randomization analyses using summarized data</article-title>. <source>Int. J. Epidemiol.</source> <volume>46</volume> (<issue>6</issue>), <fpage>1734</fpage>&#x2013;<lpage>1739</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/ije/dyx034</pub-id>
</citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yu</surname> <given-names>L.-X.</given-names>
</name>
<name>
<surname>Schwabe</surname> <given-names>R. F.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>The gut microbiome and liver cancer: mechanisms and clinical translation</article-title>. <source>Nat. Rev. Gastroenterol. Hepatol.</source> <volume>14</volume> (<issue>9</issue>), <fpage>527</fpage>&#x2013;<lpage>539</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nrgastro.2017.72</pub-id>
</citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Tang</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Xie</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Tao</surname> <given-names>Y.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Demystifying the manipulation of host immunity, metabolism, and extraintestinal tumors by the gut microbiome</article-title>. <source>Signal Transduct Target Ther.</source> <volume>4</volume>, <elocation-id>41</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41392-019-0074-5</pub-id>
</citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhou</surname> <given-names>C.-B.</given-names>
</name>
<name>
<surname>Zhou</surname> <given-names>Y.-L.</given-names>
</name>
<name>
<surname>Fang</surname> <given-names>J.-Y.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Gut microbiota in cancer immune response and immunotherapy</article-title>. <source>Trends Cancer</source> <volume>7</volume> (<issue>7</issue>), <fpage>647</fpage>&#x2013;<lpage>660</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.trecan.2021.01.010</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>