<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Mol. Biosci.</journal-id>
<journal-title>Frontiers in Molecular Biosciences</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Mol. Biosci.</abbrev-journal-title>
<issn pub-type="epub">2296-889X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">856212</article-id>
<article-id pub-id-type="doi">10.3389/fmolb.2022.856212</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Molecular Biosciences</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>An Epistatic Network Describes <italic>oppA</italic> and <italic>glgB</italic> as Relevant Genes for <italic>Mycobacterium tuberculosis</italic>
</article-title>
<alt-title alt-title-type="left-running-head">Posada-Reyes et al.</alt-title>
<alt-title alt-title-type="right-running-head">Epistatic Network for <italic>Mycobacterium tuberculosis</italic>
</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Posada-Reyes</surname>
<given-names>Ali-Berenice</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1651788/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Balderas-Mart&#xed;nez</surname>
<given-names>Yalbi I.</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1056827/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>&#xc1;vila-R&#xed;os</surname>
<given-names>Santiago</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1525360/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Vinuesa</surname>
<given-names>Pablo</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/225282/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Fonseca-Coronado</surname>
<given-names>Salvador</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1599290/overview"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Posgrado en Ciencias Biol&#xf3;gicas</institution>, <institution>UNAM</institution>, <addr-line>Mexico</addr-line>, <country>Mexico</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Facultad de Estudios Superiores Cuautitl&#xe1;n</institution>, <institution>UNAM</institution>, <addr-line>Estado de Mexico</addr-line>, <country>Mexico</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Instituto Nacional de Enfermedades Respiratorias &#x201c;Ismael Cosio Villegas&#x201d;</institution>, <addr-line>Ciudad de Mexico</addr-line>, <country>Mexico</country>
</aff>
<aff id="aff4">
<sup>4</sup>
<institution>Centro de Ciencias Gen&#xf3;micas</institution>, <institution>UNAM</institution>, <addr-line>Cuernavaca</addr-line>, <country>Mexico</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/592883/overview">Alberto Jesus Martin</ext-link>, Universidad Mayor, Chile</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/542716/overview">Ramandeep Singh</ext-link>, Translational Health Science and Technology Institute (THSTI), India</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/467487/overview">Verlaine Joy Timms</ext-link>, The University of Newcastle, Australia</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Ali-Berenice Posada-Reyes, <email>bereniceposadareyes@yahoo.com.mx</email>; Salvador Fonseca-Coronado, <email>fonsecacoronado@yahoo.com</email>
</corresp>
<fn fn-type="other">
<p>This article was submitted to Biological Modeling and Simulation, a section of the journal Frontiers in Molecular Biosciences</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>31</day>
<month>05</month>
<year>2022</year>
</pub-date>
<pub-date pub-type="collection">
<year>2022</year>
</pub-date>
<volume>9</volume>
<elocation-id>856212</elocation-id>
<history>
<date date-type="received">
<day>16</day>
<month>01</month>
<year>2022</year>
</date>
<date date-type="accepted">
<day>11</day>
<month>03</month>
<year>2022</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2022 Posada-Reyes, Balderas-Mart&#xed;nez, &#xc1;vila-R&#xed;os, Vinuesa and Fonseca-Coronado.</copyright-statement>
<copyright-year>2022</copyright-year>
<copyright-holder>Posada-Reyes, Balderas-Mart&#xed;nez, &#xc1;vila-R&#xed;os, Vinuesa and Fonseca-Coronado</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>
<italic>Mycobacterium tuberculosis</italic> is an acid-fast bacterium that causes tuberculosis worldwide. The role of epistatic interactions among different loci of the <italic>M. tuberculosis</italic> genome under selective pressure may be crucial for understanding the disease and the molecular basis of antibiotic resistance acquisition. Here, we analyzed polymorphic loci interactions by applying a model-free method for epistasis detection, SpydrPick, on a pan&#x2013;genome-wide alignment created from a set of 254 complete reference genomes. By means of the analysis of an epistatic network created with the detected epistatic interactions, we found that <italic>glgB</italic> (<italic>&#x3b1;</italic>-1,4-glucan branching enzyme) and <italic>oppA</italic> (oligopeptide-binding protein) are putative targets of co-selection in <italic>M. tuberculosis</italic> as they were associated in the network with <italic>M. tuberculosis</italic> genes related to virulence, pathogenesis, transport system modulators of the immune response, and antibiotic resistance. In addition, our work unveiled potential pharmacological applications for genotypic antibiotic resistance inherent to the mutations of <italic>glgB</italic> and <italic>oppA</italic> as they epistatically interact with <italic>fprA</italic> and <italic>embC</italic>, two genes recently included as antibiotic-resistant genes in the catalog of the World Health Organization. Our findings showed that this approach allows the identification of relevant epistatic interactions that may lead to a better understanding of <italic>M. tuberculosis</italic> by deciphering the complex interactions of molecules involved in its metabolism, virulence, and pathogenesis and that may be applied to different bacterial populations.</p>
</abstract>
<kwd-group>
<kwd>
<italic>glgB</italic>
</kwd>
<kwd>
<italic>oppA</italic>
</kwd>
<kwd>epistatic network</kwd>
<kwd>co-selection</kwd>
<kwd>
<italic>Mycobacterium tuberculosis</italic>
</kwd>
<kwd>tuberculosis</kwd>
</kwd-group>
</article-meta>
</front>
<body>
<sec id="s1">
<title>1 Introduction</title>
<p>In humans, tuberculosis (TB) is a chronic and highly contagious disease that causes more than 10 million human infections and 1.8 million deaths worldwide every year. The constant arrival of drug-resistant strains complicates its control and eradication (<xref ref-type="bibr" rid="B19">Gupta et al., 2018</xref>). This disease is mainly caused by members of the <italic>Mycobacterium tuberculosis</italic> complex (MTBC) (<xref ref-type="bibr" rid="B9">Coscolla and Gagneux, 2014</xref>) <italic>via</italic> aerosolized bacteria released by patients with TB (<xref ref-type="bibr" rid="B28">Lerner et al., 2015</xref>).</p>
<p>
<italic>Mycobacterium tuberculosis</italic> (Mtb) lineages L1&#x2013;L4 and L7 form a large group of human-adapted strains responsible for the vast majority of global human TB cases, whereas <italic>Mycobacterium africanum</italic> lineages (L5 and L6), which are restricted to humans from West Africa, are phylogenetically linked with the eighth lineage, which comprises various animal-adapted strains (<xref ref-type="bibr" rid="B16">Gonzalo-Asensio et al., 2014</xref>).</p>
<p>The first complete genome sequence of Mtb was described in 1998 (<xref ref-type="bibr" rid="B8">Cole et al., 1998</xref>). Since then, whole-genome sequencing (WGS) has been applied to a wide range of clinical scenarios, with the potential to revolutionize TB diagnosis, outbreak investigation, development of drugs and vaccines, and to assist in understanding the evolution and pathogenicity of MTBC (<xref ref-type="bibr" rid="B39">Satta et al., 2018</xref>). The increase in genomic data in this new era of big data can be considered a great opportunity to continue with the epidemiological surveillance of Mtb associated with the evaluation of genotypic antibiotic resistance. Moreover, it may allow us to unveil new genes with characteristics that lead us to a better understanding of TB.</p>
<p>Recent advances in the scale and diversity of population genomic data for Mtb provide the potential for revealing whole-genome genetic patterns. Statistical methods combined with recent advances in computational structural biology have identified the polymorphic loci (positions inside a genome) under the strongest co-evolutionary pressures or epistatic interactions (<xref ref-type="bibr" rid="B42">Skwark et al., 2017</xref>). Such epistatic interactions describe a functional relationship between genes or polymorphic loci (<xref ref-type="bibr" rid="B38">Sackton and Hartl, 2016</xref>). Studies of interactions between mutations in Mtb that result in resistance to diverse drugs have suggested that epistasis may be related to multidrug resistance (<xref ref-type="bibr" rid="B44">Trauner et al., 2014</xref>; <xref ref-type="bibr" rid="B25">Kavvas et al., 2018</xref>). However, the role of epistatic interactions among many regions of the genome under selection in Mtb remains unknown, and further study will contribute to improving our knowledge of TB.</p>
<p>In this study, we analyzed polymorphic loci interactions for epistatic detection in a set of 254 complete reference genomes from Mtb by the use of the model-free method, SpydrPick (<xref ref-type="bibr" rid="B36">Pensar et al., 2019</xref>). SpydrPick is based on calculating the mutual information between two polymorphic loci. This well-annotated reference collection integrates genome annotation, gene characterization, and a sequence variation report with a high certainty of genomic location. First, a pan-genome was created using Roary (<xref ref-type="bibr" rid="B33">Page et al., 2015</xref>). Then, using AMAS, a pan&#x2013;genome-wide alignment was obtained by concatenating individual gene alignments. This pan&#x2013;genome-wide alignment was the input for SpydrPick.</p>
<p>The application of the method to this data set allowed us to reconstruct an epistatic network. The analysis of this network revealed two putative targets of co-selection (<italic>glgB</italic> and <italic>oppA</italic>) associated with Mtb genes related to virulence, pathogenesis, transport system modulators of the immune response, and antibiotic resistance. This work may have relevant applications in the characterization of new genes involved in the worldwide problem of Mtb drug resistance (<xref ref-type="bibr" rid="B46">WHO, 2021</xref>).</p>
</sec>
<sec id="s2">
<title>2 Materials and Methods</title>
<p>An overview of our approach is depicted in <xref ref-type="fig" rid="F1">Figure 1</xref>. The steps are described in the following subsections.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>Pipeline for the study of epistatic interactions in Mtb.</p>
</caption>
<graphic xlink:href="fmolb-09-856212-g001.tif"/>
</fig>
<sec id="s2-1">
<title>2.1 Data Set</title>
<p>We gathered 254 reference strains of Mtb that were available in the NCBI RefSeq database as of 4 November 2020. The list of strains is provided as <xref ref-type="sec" rid="s10">Supplementary Data S1</xref>.</p>
</sec>
<sec id="s2-2">
<title>2.2 Creating Pan&#x2013;Genome-Wide Alignment</title>
<p>Following the strategy of <xref ref-type="bibr" rid="B36">Pensar et al. (2019)</xref>, we created a pan&#x2013;genome-wide alignment of the 254 strains. First, we employed Prokka (<xref ref-type="bibr" rid="B40">Seemann, 2014</xref>) to annotate genes and features of interest in the set of strains. This genome annotation (GFF3 format) was the input to create a pan-genome of the strains with Roary (<xref ref-type="bibr" rid="B33">Page et al., 2015</xref>).</p>
<p>This tool extracts the gene sequences from the input and then identifies clusters to obtain gene alignments. Roary considers two categories of genes: core and accessory. A gene is considered &#x201c;core&#x201d; if it is in at least a certain percentage of strains (isolates) defined by the user. In our study, we followed the approach of <xref ref-type="bibr" rid="B36">Pensar et al. (2019)</xref>, who set this percentage at 95% of the strains. The output of Roary is a set of files with individual gene alignments, with one file per gene. These files are concatenated in a matrix using the Alignment Manipulation and Summary (AMAS) tool (<xref ref-type="bibr" rid="B5">Borowiec, 2016</xref>). This matrix is formed by gene 1 joined on the right with gene 2 and so on with the rest of the genes [see the example &#x201c;A: concatenation&#x201d; from Figure 1 in <xref ref-type="bibr" rid="B5">Borowiec (2016)</xref>]. Thus, the columns of the output matrix are the genes, and the number of rows is the number of strains used to generate the pan&#x2013;genome-wide alignment (254 in this case).</p>
</sec>
<sec id="s2-3">
<title>2.3 Global Diversity Evaluation</title>
<p>The pan&#x2013;genome-wide alignment was evaluated for global diversity by estimating a phylogeny using RAxML Next Generation (<xref ref-type="bibr" rid="B27">Kozlov et al., 2019</xref>). A standard nonparametric bootstrap of 1,000 replicates was performed. Phylogenies were visualized using iTOL v. 6.4.1 (<xref ref-type="bibr" rid="B29">Letunic and Bork, 2021</xref>).</p>
</sec>
<sec id="s2-4">
<title>2.4 Genetic Prediction of Antibiotic Resistance</title>
<p>We predicted a resistome for the 254 strains using the Resistance Gene Identifier (RGI) tool v. 5.1.1 (<xref ref-type="bibr" rid="B1">Alcock et al., 2020</xref>). RGI uses the Comprehensive Antibiotic Resistance Database (CARD) as reference data. Using the output of RGI, we annotated strains for two genotypic characterizations of antibiotic resistance: multidrug-resistant (MDR) strains for those strains with genes resistant to isoniazid and rifampicin and extensively drug-resistant (XDR) strains if they have genes resistant to isoniazid, rifampicin, fluoroquinolone, and at least one of the following three antibiotics: kanamycin, amikacin, or capreomycin. These annotations were incorporated for visualization into the phylogeny displayed by iTOL.</p>
</sec>
<sec id="s2-5">
<title>2.5 Computational Detection of Epistatic Interactions</title>
<sec id="s2-5-1">
<title>2.5.1 Epistatic Interaction Detection</title>
<p>We utilized SpydrPick (<xref ref-type="bibr" rid="B36">Pensar et al., 2019</xref>) to detect the epistatic interactions in the pan&#x2013;genome-wide alignment. SpydrPick is a model-free method whose computational efficiency enables analysis at the scale of pan-genomes of bacteria. This method facilitates the detection of targets of co-selection related to virulence and antibiotic resistance. The potential of this method is the detection of epistatic interactions in the absence of phenotypic data.</p>
<p>The approach of SpydrPick is based on calculating the mutual information (MI) between two polymorphic loci. MI is an information-theoretic measure of the amount of information that one random variable, <italic>X</italic>, contains about another random variable, <italic>Y</italic>. MI is also defined as the reduction in uncertainty in <italic>X</italic> after observing <italic>Y</italic>; in other words, MI manifests the reduction in uncertainty of <italic>X</italic> due to the knowledge of <italic>Y</italic> (<xref ref-type="bibr" rid="B10">Cover and Thomas, 2006</xref>). MI gives a measure of association or correlation between <italic>X</italic> and <italic>Y</italic> (<xref ref-type="bibr" rid="B7">Chanda et al., 2020</xref>); if the two variables, <italic>X</italic> and <italic>Y</italic>, are independent, then the MI is zero. MI is formally defined as follows:<disp-formula id="e1">
<mml:math id="m1">
<mml:mi>M</mml:mi>
<mml:mi>I</mml:mi>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>X</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>Y</mml:mi>
</mml:mrow>
</mml:mfenced>
<mml:mo>&#x3d;</mml:mo>
<mml:munder>
<mml:mrow>
<mml:mo>&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>x</mml:mi>
<mml:mo>&#x2208;</mml:mo>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>X</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:munder>
<mml:munder>
<mml:mrow>
<mml:mo>&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>y</mml:mi>
<mml:mo>&#x2208;</mml:mo>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>Y</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:munder>
<mml:mi>p</mml:mi>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>x</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>y</mml:mi>
</mml:mrow>
</mml:mfenced>
<mml:mi>log</mml:mi>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mfrac>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>x</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>y</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>x</mml:mi>
</mml:mrow>
</mml:mfenced>
<mml:mi>p</mml:mi>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>y</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:mfenced>
<mml:mo>,</mml:mo>
</mml:math>
<label>(1)</label>
</disp-formula>where <italic>p</italic>(<italic>x</italic>, <italic>y</italic>) is the joint probability and <italic>p</italic>(<italic>x</italic>) and <italic>p</italic>(<italic>y</italic>) are the marginal probabilities of <italic>X</italic> and <italic>Y</italic>. MI has been successfully used for detecting co-selection in bacterial population genomics at a genome-wide scale. Another relevant feature introduced by SpydrPick&#x2019;s approach is the correction for population structure. This correction is applied through a sequence reweighting strategy based on how different the sequences in the pan&#x2013;genome-wide alignment are (<xref ref-type="bibr" rid="B36">Pensar et al., 2019</xref>).</p>
<p>SpydrPick detects direct and indirect interactions between loci. A direct interaction occurs between two positions (<italic>P</italic>
<sub>1</sub> &#x2192; <italic>P</italic>
<sub>2</sub>), whereas an indirect interaction occurs when the two positions (<italic>P</italic>
<sub>1</sub> and <italic>P</italic>
<sub>2</sub>) are also linked through a third position (<italic>P</italic>
<sub>1</sub> &#x2192; <italic>P</italic>
<sub>3</sub> &#x2192; <italic>P</italic>
<sub>2</sub>). In the case of indirect interactions (<italic>P</italic>
<sub>1</sub> &#x2192; <italic>P</italic>
<sub>2</sub>), SpydrPick removes the interaction if the MI is not larger than the other two interactions (<italic>P</italic>
<sub>1</sub> &#x2192; <italic>P</italic>
<sub>3</sub> and <italic>P</italic>
<sub>3</sub> &#x2192; <italic>P</italic>
<sub>2</sub>).</p>
<p>In addition, SpydrPick performs an analysis to detect outlier interactions. A first criterion to filter outliers is that the distance (bp) between the positions of polymorphic loci must be greater than a linkage disequilibrium (LD) parameter. In this case, a strong LD refers to a close genetic distance between two nucleotide positions. Because a strong LD hides a prospective signal of shared co-evolutionary selection pressure, SpydrPick filters out pairs of positions with strong LD to select outlier interactions. According to SpydrPick&#x2019;s documentation (<ext-link ext-link-type="uri" xlink:href="https://github.com/santeripuranen/SpydrPick">https://github.com/santeripuranen/SpydrPick</ext-link>), for bacterial genomes, the typical values of the LD are in the 500&#x2013;20,000&#xa0;bp range, and the default approach to filtering out strong LD pairs is using a simple distance-based cut-off (20,000&#xa0;bp in our case). The second criterion is that the MI must be greater than a threshold obtained from Tukey&#x2019;s outlier test <italic>Q</italic>
<sub>3</sub> &#x2b; 1.5 &#xd7; (<italic>Q</italic>
<sub>3</sub> &#x2212; <italic>Q</italic>
<sub>1</sub>) (<xref ref-type="bibr" rid="B45">Tukey, 1977</xref>).</p>
<p>The output of SpydrPick is a table of epistatic interactions that includes the pair of positions of two interacting polymorphic loci in the pan&#x2013;genome-wide alignment, the genome distance between the two positions, the type of interaction (direct/indirect), and the MI score. When SpydrPick detects outliers, they are reported in another table, including three additional fields: the MI score without gaps, the gap effect, and if the outlier is considered an extreme outlier (<italic>MI</italic> &#x3e; <italic>Q</italic>
<sub>3</sub> &#x2b; 3 &#xd7; (<italic>Q</italic>
<sub>3</sub> &#x2212; <italic>Q</italic>
<sub>1</sub>)). From the input alignment, SpydrPick categorizes any character different from A, C, G, and T as a gap. Gaps are considered in the default MI calculation, so <italic>X</italic> and <italic>Y</italic> have an outcome space of five categories. As the gaps may not be informative, SpydrPick calculates for each pair of positions in the outliers another MI score considering only those strains without gaps in either of the two positions. This MI score is named mutual information without gaps (MI_wo_gaps). Using the MI score without gaps, the gap effect is calculated as (1 &#x2212; <italic>MI</italic>_<italic>wo</italic>_<italic>gaps</italic>/<italic>MI</italic>) &#xd7; 100 to quantify the positive or negative effect on the MI of discarding strains with gaps in the two positions.</p>
<p>Comparing MI scores without gaps in a meaningful way is difficult due to the fact that the set of strains without gaps in the two positions varies between pairs of positions (<xref ref-type="bibr" rid="B36">Pensar et al., 2019</xref>). However, a high value of the gap effect for a given pair of positions may indicate a gap-driven interaction, and a manual analysis of the pair should be required. Thus, following the analysis performed by <xref ref-type="bibr" rid="B36">Pensar et al. (2019)</xref>, we used the default MI, leaving the analysis of the MI_wo_gaps for a future in-depth study.</p>
<p>The loci of epistatic interaction were annotated with gene id and gene name. Gene names were obtained from the partitions generated by AMAS using an R script. Afterward, using another R script (<ext-link ext-link-type="uri" xlink:href="https://github.com/biotb/epitb-net">https://github.com/biotb/epitb-net</ext-link>) and the R Biomartr library (<xref ref-type="bibr" rid="B15">Drost and Paszkowski, 2017</xref>), we retrieved the ENTREZ gene id by searching the gene name in the GFF file of the Mtb H37Rv reference genome (GCF_000195955.2).</p>
<p>If there is no gene name detected by Roary during the pan-genome creation, then Roary gives a unique generic name formed by the prefix group and a consecutive number. These generic names also appear in partitions of AMAS; however, no ENTREZ id could be associated with these generic names as these names did not exist in the reference genome GFF file.</p>
<p>On the other hand, Prokka uses a numeric suffix to indicate different annotations of the same gene, such as carB_1 and carB_2 (carbamoyl-phosphate synthase large chain). These names were also not found in the reference genome GFF file. In these cases, we eliminated the numeric suffix to find the gene name in the reference genome file. For example, we were able to find the gene id 886253 for <italic>carB</italic>.</p>
</sec>
<sec id="s2-5-2">
<title>2.5.2 Functional Enrichment Analysis</title>
<p>We used the database for annotation, visualization, and integrated discovery (DAVID) v6.8 (<xref ref-type="bibr" rid="B22">Huang et al., 2009</xref>) to obtain a functional annotation of Gene Ontology (GO) terms and KEGG pathways of the genes participating in the epistatic interactions. Specifically, we used the DAVID Web Service Python Script (<xref ref-type="bibr" rid="B24">Jiao et al., 2012</xref>) to generate a chart report.</p>
</sec>
<sec id="s2-5-3">
<title>2.5.3 Network of Epistatic Interactions</title>
<p>The set of epistatic interactions can be seen as a model of complex epistatic relations that may be analyzed and displayed as a network. Here, we used Cytoscape (<xref ref-type="bibr" rid="B26">Kohl et al., 2011</xref>) to study our set of epistatic interactions. This tool has been utilized for studying diverse types of genetic networks. Cytoscape includes an Analyze Network Tool that calculates several network parameters, such as node degree and betweenness centrality. Another useful tool of Cytoscape is the set of layout algorithms provided by the yFiles Layout Algorithms app. These algorithms visually organize a network by aligning and rotating groups of nodes.</p>
</sec>
<sec id="s2-5-4">
<title>2.5.4 Highly Connected Nodes Analysis and Visualization</title>
<p>We focused on the most highly connected genes (the highest degree) for analyzing our epistatic network. Functional characterization of these genes was performed by literature curation and showing enriched GO terms for genes interacting with them. In addition, we used the R package SeqinR (<xref ref-type="bibr" rid="B18">Gouy et al., 1985</xref>) to upload the pan&#x2013;genome-wide alignment and extract the allele distribution at loci involved in their epistatic interactions. We used the interactive web tool Phandango, which is used to visualize phylogenetic trees and associated genomic information (<xref ref-type="bibr" rid="B20">Hadfield et al., 2017</xref>), to show the estimated phylogeny and allele distribution of loci.</p>
</sec>
</sec>
</sec>
<sec sec-type="results|discussion" id="s3">
<title>3 Results and Discussion</title>
<sec id="s3-1">
<title>3.1 Pan&#x2013;Genome-Wide Alignment</title>
<p>A total of 6,205 individual genes were aligned by Roary, including 3,659 core genes. After concatenating all individual genes with AMAS, a pan&#x2013;genome-wide alignment of 6,751,593&#xa0;bp was obtained.</p>
</sec>
<sec id="s3-2">
<title>3.2 Estimated Phylogeny and Antibiotic Resistance Prediction</title>
<p>Based on the Akaike Information Criterion (AIC) and the Bayesian Information Criterion (BIC), which are information-theoretic criteria that penalize complex models, we selected the phylogeny estimated using a GTR model with four free rates (GTR-R4-FO). The comparison of models is provided in <xref ref-type="sec" rid="s10">Supplementary Table S1</xref>. Convergence using the extended majority rule (MRE) criterion (<xref ref-type="bibr" rid="B35">Pattengale et al., 2010</xref>) with a 3% cutoff for the bootstrapping was reached after 400 trees.</p>
<p>The prediction of antibiotic resistance by RGI reported that 100% of the 254 strains were MDR (<xref ref-type="fig" rid="F2">Figure 2</xref>) and, within this, 15% were XDR. This result indicates that bacterial strains, perhaps currently circulating, present a high level of resistance to first-line treatments, hindering the successful response to treatment and facilitating the dissemination of strains with drug resistance mutations. Thus, detecting epistatic interactions to elucidate polymorphic loci under the strongest co-evolutionary pressure is of utmost importance for molecular surveillance with bioinformatic tools that help us characterize them promptly. Currently, it is reported that 3.4% of the new TB patients and 20% of the patients with a history of previous treatment for TB were diagnosed with MDR TB worldwide (<xref ref-type="bibr" rid="B46">WHO, 2021</xref>).</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>Phylogenetic tree of the Mtb pan-genome shown as an iTOL circular visualization with the branch lengths and the bootstrap values displayed. The tree is based on the Maximum Likelihood topology of 254 strains representative of Mtb diversity and shows that length is proportional to nucleotide topology. Bootstrap values for clades corresponding to the main Mtb clades are shown. The colors correspond to the different genotypic characterizations of antibiotic resistance (MDR &#x3d; Multidrug-Resistant; XDR &#x3d; Extensively Drug-Resistant).</p>
</caption>
<graphic xlink:href="fmolb-09-856212-g002.tif"/>
</fig>
<p>The phylogenetic tree (<xref ref-type="fig" rid="F2">Figure 2</xref>) shows the nucleotide diversity of Mtb (254-strain collection). In this study, there is heterogeneity of submitters; 100% of the strains present genes linked to antibiotic resistance; and, with respect to the H37Rv strain (reference), most of the strains present greater genetic diversity.</p>
</sec>
<sec id="s3-3">
<title>3.3 Detected Epistatic Interactions</title>
<p>SpydrPick detected 10,573 outlier epistatic interactions (5,484 direct and 5,089 indirect). These interactions describe polymorphic loci under the strongest co-evolutionary pressure. A table with the complete list of outliers is provided as <xref ref-type="sec" rid="s10">Supplementary Data S2</xref>. This table includes the fields described in <xref ref-type="sec" rid="s2-5-1">subsection 2.5.1</xref>, that is, the pair of positions of the two interacting polymorphic loci in the pan&#x2013;genome-wide alignment, genome distance between the two positions, type of interaction (direct/indirect), MI score, MI score without gaps, gap effect, and whether the outlier interaction is considered an extreme outlier.</p>
<p>After gene annotation, we generated a new table of epistatic interactions that excluded the generic gene names given by Roary. The new table of outliers included 1,940 epistatic interactions among 107 unique genes. From this set of genes, we only found 70 in the reference genome GFF file, and they were associated with their ENTREZ id. Retaining only those interactions that include these 70 genes, we obtained a final table with 890 outlier interactions. The remaining interactions that were not considered in our study will be included in a future analysis.</p>
<p>The final table of outlier interactions includes the two positions of the two interacting polymorphic loci in the pan&#x2013;genome-wide alignment, gene ENTREZ id and gene name for each position, distance between the two positions (bp), type of interaction (direct &#x3d; 1, indirect &#x3d; 0), MI score of the interaction, and if the interaction outlier is an extreme outlier (yes &#x3d; 1, no &#x3d; 0). This final table of outliers (<xref ref-type="sec" rid="s10">Supplementary Data S3</xref>) was used for enrichment analysis, network reconstruction, and analyses.</p>
<p>SpydrPick was able to find long-distance interactions surpassing the two million bp (<xref ref-type="table" rid="T1">Table 1</xref>). This fact confirms that our study has a whole-genome scale. However, because we identified epistatic interactions from a pan&#x2013;genome-wide alignment constructed by concatenating individual gene alignments, the positions are not straightforward whole-genome loci. The minimum distance (bp) between the positions of the two interacting polymorphic loci only slightly surpassed the LD criterion of 20,000&#xa0;bp. The mean of the distance between polymorphic loci in the outlier interactions was 846,454&#xa0;bp; considering that it is greater than the median (721,980&#xa0;bp), there may be a slight skewness to distances lower than the mean. On the other hand, the range of MI scores was short, from 0.4130 to 0.5020 (<xref ref-type="table" rid="T1">Table 1</xref>). The MI scores might show a skewness to low values as the mean (0.4509) was higher than the median (0.4202).</p>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>Statistics of the distance between positions of the two interacting polymorphic loci and statistics of the MI scores, both for the final outlier interactions.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Statistic of the final outlier interactions</th>
<th align="center">Values</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Minimum distance (bp)</td>
<td align="center">20,870</td>
</tr>
<tr>
<td align="left">Maximum distance (bp)</td>
<td align="center">2,328,291</td>
</tr>
<tr>
<td align="left">Median distance (bp)</td>
<td align="center">721,980</td>
</tr>
<tr>
<td align="left">Mean distance (bp)</td>
<td align="center">846,454</td>
</tr>
<tr>
<td align="left">Minimum MI score</td>
<td align="center">0.4130</td>
</tr>
<tr>
<td align="left">Maximum MI score</td>
<td align="center">0.5020</td>
</tr>
<tr>
<td align="left">Median MI score</td>
<td align="center">0.4202</td>
</tr>
<tr>
<td align="left">Mean MI score</td>
<td align="center">0.4509</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>All loci in the 890 interactions were found in the described single-nucleotide polymorphisms (SNPs) when we used the pan&#x2013;genome-wide alignment with the tool SNP-sites v. 2.5.1, which can rapidly identify SNPs from a multi-FASTA alignment (<xref ref-type="bibr" rid="B34">Page et al., 2016</xref>). This additional step was developed to identify polymorphisms involved in the detected epistatic interactions.</p>
</sec>
<sec id="s3-4">
<title>3.4 Epistatic Network Analysis</title>
<sec id="s3-4-1">
<title>3.4.1 <italic>glgB</italic> and <italic>oppA</italic> as Putative Targets of Co-selection</title>
<p>The network of epistatic interactions was analyzed to figure out those genes with a high node degree (the number of edges), that is, a high level of connectivity of the gene with other genes. The most highly connected genes were <italic>glgB</italic> (ENTREZ:886893, degree &#x3d; 56), an <italic>&#x3b1;</italic>-1,4-glucan branching enzyme (GlgB), and <italic>oppA</italic> (ENTREZ:886985, degree &#x3d; 37), an oligopeptide-binding protein (OppA) (<xref ref-type="fig" rid="F3">Figure 3</xref>).</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>Network of outlier epistatic interactions. The gradient color of nodes depicts the node degree. The gradient color of edges depicts values of MI.</p>
</caption>
<graphic xlink:href="fmolb-09-856212-g003.tif"/>
</fig>
<p>These two genes also have the highest value of betweenness centrality (<italic>glgB</italic> &#x3d; 0.493, <italic>oppA</italic> &#x3d; 0.219). Betweenness centrality is higher for those nodes that join subnets (communities) than those located inside the subnets. Here, we observed three subnets connected by these two genes. An interesting pattern is that each subnet has a different distribution of values of MI (see gradient color of edges in <xref ref-type="fig" rid="F3">Figure 3</xref>). The subnet at the bottom has higher MI values (median MI &#x3d; 0.502) than the other two, the top subnet has a median MI of 0.463, and the subnet at the middle has lower values (median MI &#x3d; 0.420). A further study is required to elucidate the cause of this pattern. In addition, future analysis will be required to identify the patterns associated with the isolated subnets (<italic>mmpL1</italic>-<italic>mmpS4</italic> and <italic>lipR</italic>-<italic>ponA1</italic>).</p>
<p>Thus, we consider these two genes as relevant putative targets of co-selection because they may be associated with several genes related to potential pharmacological applications. The GlgB enzyme (encoded by Rv1326c) is the key enzyme involved in the biosynthesis of <italic>&#x3b1;</italic>-glucan, which plays a significant role in the virulence and pathogenesis of Mtb. Recently, enzymes that participate in the biosynthesis of trehalose have gained major attention as drug targets, especially in Mtb (<xref ref-type="bibr" rid="B13">Dkhar et al., 2015</xref>), as capsular polysaccharides of bacteria have been found to modulate the host immune response. The importance of the metabolism of GlgB has been described (<xref ref-type="bibr" rid="B12">De Smet et al., 2000</xref>), but the epistatic interactions with other genes remain unknown.</p>
<p>On the other hand, the gene <italic>oppA</italic> (oligopeptide-binding protein) works as a substrate-binding protein for the oligopeptide transport system (Opp), which is responsible for peptide importation. The Opp system is an ATP-binding cassette transporter. This helps in peptide absorption, giving pathogens the essential nutrients as a source of carbon, nitrogen, and amino acids. The Opp system affects many cellular processes, including internalization of quorum-sensing peptides, biofilm production, cell surface modification, and antibiotic resistance (<xref ref-type="bibr" rid="B21">Hopfe et al., 2011</xref>). The relevance of the characterization of the peptide transporter system has been described by <xref ref-type="bibr" rid="B11">Dasgupta et al. (2010)</xref>. Previous studies uncovered the novel observation that this peptide transporter modulates the innate immune response of macrophages infected with Mtb (<xref ref-type="bibr" rid="B6">Cassio Barreto de Oliveira and Balan, 2020</xref>), but the epistatic interactions of <italic>oppA</italic> with other loci remain unknown.</p>
<p>A bacterium is able to adapt its response to host conditions, such as intracellular residence in phagocytic cells, oxidative stress, hypoxia, and carbon and nitrogen source. For this reason, evaluating interactions by bioinformatics experiments is necessary for the identification of new epistatic interactions in genes that have been previously reported in databases, such as the catalog of the WHO, or for the understanding of the epistatic interactions in Mtb before the development of new therapies.</p>
</sec>
<sec id="s3-4-2">
<title>3.4.2 Enriched GO Terms for the Epistatic Network</title>
<p>The list of ENTREZ ids of the genes of the network was used to perform a functional enrichment analysis with DAVID. From the DAVID chart report, we only considered as relevant those terms with a <italic>p</italic>-value <inline-formula id="inf1">
<mml:math id="m2">
<mml:mo>&#x3c;</mml:mo>
</mml:math>
</inline-formula> 0.05 (see <xref ref-type="sec" rid="s10">Supplementary Data S4</xref> for details of the functional enrichment analysis). Biological processes of pathogenesis (GO:0009405) and cell wall organization (GO:0071555) were enriched in a subset of genes (<xref ref-type="fig" rid="F4">Figure 4</xref>). The cell wall (GO:0005618), plasma membrane (GO:0005886), cytosol (GO:0005829), and integral components of the plasma membrane (GO:0005887) were the more abundant cellular components; in this case, 63% of the genes are in the plasma membrane. Regarding molecular functions, we obtained enrichment for ATP binding (GO:0005524) and phosphoprotein phosphatase activity (GO:0004721) for some genes.</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>Enriched GO terms for outliers. The <italic>p</italic>-value is indicated for each term. BP &#x3d; Biological process; CC &#x3d; Cellular Component; MF &#x3d; Molecular function.</p>
</caption>
<graphic xlink:href="fmolb-09-856212-g004.tif"/>
</fig>
<p>Recently, the biomarkers of Mtb that regulate immune response have been identified to potentially develop drugs for TB. It has been previously described that the functionality of cellular components was associated with infection and verified the regulation of these cellular components as relevant regulators of the immune response in the host (<xref ref-type="bibr" rid="B30">Li et al., 2020</xref>). Thus, describing the genes involved in cellular components is crucial for understanding the interactions of bacteria with host molecules that regulate immune response.</p>
<p>In recent studies, the relevance of the structure and biogenesis-related genes of Mtb encoding glycoconjugates has been confirmed, with particular emphasis on the molecules across the different layers of the cell envelope (<xref ref-type="bibr" rid="B2">Angala et al., 2014</xref>). In addition, it has been previously stressed that ATP production is crucial for antibiotic resistance in bacteria (<xref ref-type="bibr" rid="B3">Black et al., 2014</xref>).</p>
<p>We show the enriched GO terms of genes interacting with <italic>glgB</italic> (<xref ref-type="fig" rid="F5">Figure 5B</xref>) and <italic>oppA</italic> (<xref ref-type="fig" rid="F5">Figure 5F</xref>) using circular layouts. In addition, <xref ref-type="sec" rid="s10">Supplementary Data S5</xref> also contains in table format the genes interacting with <italic>glgB</italic>, their product, and enriched GO terms; the same information is provided for <italic>oppA</italic> in <xref ref-type="sec" rid="s10">Supplementary Data S6</xref>. The layouts were generated using the start and end positions of genes reported in partitions generated by AMAS, so the arrangement and size of genes in the layout and positions of interactions reflect the pan&#x2013;genome-wide alignment. We have highlighted the interactions of <italic>glgB</italic> and <italic>oppA</italic> in red to distinguish them from the interaction of other genes (shown in gray).</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>Enriched GO terms of genes that interact with <italic>glgB</italic> and <italic>oppA</italic>. The arrangement and size of genes and positions of interactions reflect the pan&#x2013;genome-wide alignment. Red lines indicate interactions of <italic>glgB</italic> and <italic>oppA</italic>, whereas gray indicates the interaction of other genes. <bold>(A)</bold> Epistatic network. <bold>(B)</bold> <italic>glgB</italic> interactions (subnet). <bold>(C)</bold> Enriched cellular components of genes interacting with <italic>glgB</italic>. <bold>(D)</bold> Enriched biological processes of genes interacting with <italic>glgB</italic>. <bold>(E)</bold> Enriched molecular functions of genes interacting with <italic>glgB</italic>. <bold>(F)</bold> <italic>oppA</italic> interactions (subnet). <bold>(G)</bold> Enriched cellular components of genes interacting with <italic>oppA</italic>. <bold>(H)</bold> Enriched biological processes of genes interacting with <italic>oppA</italic>. <bold>(I)</bold> Enriched molecular functions of genes interacting with <italic>oppA</italic>.</p>
</caption>
<graphic xlink:href="fmolb-09-856212-g005.tif"/>
</fig>
<p>Both <italic>glgB</italic> and <italic>oppA</italic> epistatically interact with genes enriched with the biological processes of pathogenesis and cell wall organization (<xref ref-type="fig" rid="F5">Figures 5D,H</xref>). One of these genes is <italic>embC</italic>, which encodes an arabinosyltransferase involved in the biosynthesis of a major component of the mycobacterial cell wall, lipoarabinomannan (LAM). The characteristic mannose-capped LAM of Mtb acts as a pathogen-associated molecular pattern (PAMP), modulating the activation of phagocytic cells to control the strength of the host inflammatory immune response, while representing one of the main components in the cell wall organization. In addition, it has been described that <italic>embC</italic> is expressed as part of a polycistronic mRNA controlled by a promoting region differentially expressed depending on the stationary or hypoxia-induced persistence phase of the bacilli, highlighting the important role of this protein in the biological functions of Mtb and the complex interaction involved in cell wall regulation. Whether or not a direct interaction of <italic>embC</italic> with <italic>glgB</italic> and/or <italic>oppA</italic> exists remains an exciting question to be addressed (<xref ref-type="bibr" rid="B17">Goude et al., 2008</xref>).</p>
<p>Regarding molecular functions, <italic>oppA</italic> and <italic>glgB</italic> interact with several genes enriched with ATP binding and with three genes enriched with phosphoprotein phosphatase activity (<xref ref-type="fig" rid="F5">Figures 5E, I</xref>). Among these genes, <italic>bacA</italic> is another gene found to be interacting at the highest scores with both <italic>glgB</italic> and <italic>oppA</italic> in the network, and <italic>bacA</italic> encodes a protein of the type IV family of ABC transporter&#x2013;type exporters; despite this structure, its function as an importer of multi-solute hydrophilic compounds, such as vitamin B12, bleomycin, and aminoglycosides, has been demonstrated due to a large occluded water-filled cavity that spans across the whole lipid membrane. In addition, it has also been demonstrated that this transporter is implicated in the maintenance of chronic infection in murine models by mediating the transport of a molecule that can directly or indirectly modulate the proinflammatory host response. Despite having different structures, BacA and OppA share the ability to transport a wide range of substrates; in particular, the shared capacity to import peptides related to the innate immune response suggests a complex regulation and interaction of these transporters, warranting studies at the level of gene regulation and function in the near future (<xref ref-type="bibr" rid="B14">Domenech et al., 2009</xref>; <xref ref-type="bibr" rid="B6">Cassio Barreto de Oliveira and Balan, 2020</xref>; <xref ref-type="bibr" rid="B37">Rempel et al., 2020</xref>).</p>
<p>The enriched GO terms that may be related to those associated with ATP synthase in mycobacteria are of particular interest because they contribute to efficient ATP production, and this enzyme has been validated as a target for potential pharmacological applications. In addition, mycobacterial ATP synthase and its characteristics may provide information on adaptations of bacterial energy metabolism. Mtb can survive in human macrophages for an extended time. For Mtb and other pathogenic mycobacteria strains, the blocking of ATP hydrolysis is relevant as it may represent an adaptation to its internal and external human phagosomes, where ATP, once produced, must not be used (<xref ref-type="bibr" rid="B31">Lu et al., 2014</xref>). Thus, the importance of epistatic interactions associated with ATP production in pathogenic bacteria may face exceptional challenges as a variety of pathogens need to deal with low energy conditions, such as low oxygen tensions or nutrient limitation inside the host.</p>
<p>Regarding gene interactions enriched with phosphoprotein phosphatase activity, both <italic>oppA</italic> and <italic>glgB</italic> established epistatic interaction with the <italic>pstP</italic> gene, which encodes the Serine/Threonine Protein Phosphatase PstP of Mtb. Signal sensing and transduction <italic>via</italic> phosphorylation and dephosphorylation of specific target proteins are essential for the survival of both eukaryotic and prokaryotic organisms. In the case of Mtb, 11 serine/threonine protein kinases have been described, but only one serine/threonine phosphatase, PstP, has been identified, highlighting the central role of this protein in the control of vital processes as a negative regulator of kinase activity and global serine and threonine phosphorylation (<xref ref-type="bibr" rid="B23">Iswahyudi et al., 2019</xref>).</p>
<p>Recently, other functions of PstP as a regulator of cell wall synthesis and cell division by dephosphorylation of key substrates implicated in both pathways have been described (<xref ref-type="bibr" rid="B41">Sharma et al., 2016</xref>). PstP is co-transcribed in an operon with genes involved in peptidoglycan synthesis, with protein kinases PknA and PknB that regulate cell growth and cell division and with <italic>fhaA</italic> and <italic>fhaB</italic>, which encode phosphothreonine recognition proteins that also regulate cell growth and cell division. The involvement of <italic>pstP</italic> with elements necessary for cell wall biosynthesis and their strict dependence on Mn<sup>2&#x2b;</sup> for function suggests that the interaction encountered by the computational approach could serve as a starting point for initiating investigations into the molecular interactions that regulate these common processes.</p>
<p>PstP is present as a transmembrane phosphatase and contains a 240&#x2013;amino acid intracellular catalytic domain, tethered <italic>via</italic> a single transmembrane helix to the 196-amino acid-long extracellular domain (<xref ref-type="bibr" rid="B4">Boitel et al., 2003</xref>); it remains to be elucidated if during infection and activation of the innate immune responses (e.g., respiratory burst activation), the degraded bacteria retain the phosphatase activity in the membrane fragments, and these could contribute to the dephosphorylation of the signaling pathways of the innate system, contributing to the evasion of the immune response.</p>
<p>Four cellular components were enriched for genes interacting with <italic>glgB</italic> (<xref ref-type="fig" rid="F5">Figure 5C</xref>) and <italic>oppA</italic> (<xref ref-type="fig" rid="F5">Figure 5G</xref>). The majority of genes encode proteins in the plasma membrane. For example, four genes of the group of mycobacterial membrane protein large (MmpL), <italic>mmpL2</italic>, <italic>mmpL3</italic>, <italic>mmpL5</italic>, and <italic>mmpL8</italic>, have epistatic interactions with <italic>glgB</italic> and <italic>oppA</italic>. MmpL proteins export cell envelope components (such as virulence-associated lipids and siderophores) to the periplasmic space, contributing at a high level to the persistence of Mtb in the host (<xref ref-type="bibr" rid="B32">Melly and Purdy, 2019</xref>). A further study will be required to investigate the fine regulation between the import and export systems of genes identified under epistatic interaction by our approach in order to establish their relevance and biological implications.</p>
</sec>
<sec id="s3-4-3">
<title>3.4.3 Allele Distribution at Loci of Genes Interacting With <italic>glgB</italic> and <italic>oppA</italic>
</title>
<p>To observe the patterns of alleles of the interacting polymorphic loci, we show the allele distribution at interacting loci with the loci of <italic>glgB</italic> and <italic>oppA</italic> using Phandango (<xref ref-type="bibr" rid="B20">Hadfield et al., 2017</xref>). SpydrPick detected that three loci of <italic>glgB</italic> (837,764, 839,047, and 839,053) interact with 57 polymorphic loci of 56 genes. For <italic>oppA</italic>, two polymorphic loci (5,934,914 and 5,936,231) were found interacting with 38 loci of 37 genes. Tables with loci and genes are available in the <xref ref-type="sec" rid="s10">Supplementary Data S7, S8</xref>.</p>
<p>Interacting loci and gene names are displayed as labels of columns in <xref ref-type="fig" rid="F6">Figure 6</xref> for <italic>glgB</italic> and in <xref ref-type="fig" rid="F7">Figure 7</xref> for <italic>oppA</italic>. Interacting loci are organized in sections with borders. Each section includes the interactions for each interacting locus. The border color for each section corresponds to the color of the sections in <xref ref-type="sec" rid="s10">Supplementary Data S7, S8</xref>. In <xref ref-type="fig" rid="F6">Figure 6</xref>, the first section starts with the loci 837,764 and 839,047 of <italic>glgB</italic> (glgB_837764 and glgB_839047) followed by the 29 polymorphic loci that interact with them, that is, these two loci epistatically interact with each one of the 29 loci.</p>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption>
<p>Allele distribution at the loci of genes interacting with <italic>glgB</italic>. Labels of the column indicate gene name and locus. Estimated phylogeny is included on the left. Interacting loci are organized in sections with borders. The border color corresponds to the color of the sections in <xref ref-type="sec" rid="s10">Supplementary Data S7</xref>. GAR &#x3d; Genotypic Antibiotic Resistance.</p>
</caption>
<graphic xlink:href="fmolb-09-856212-g006.tif"/>
</fig>
<fig id="F7" position="float">
<label>FIGURE 7</label>
<caption>
<p>Allele distribution at the loci of genes interacting with <italic>oppA</italic>. Labels of the column indicate gene name and locus. Estimated phylogeny is included on the left. Interacting loci are organized in sections with borders. The border color corresponds to the color of the sections in <xref ref-type="sec" rid="s10">Supplementary Data S8</xref>. GAR &#x3d; Genotypic Antibiotic Resistance.</p>
</caption>
<graphic xlink:href="fmolb-09-856212-g007.tif"/>
</fig>
<p>By observing the allele distribution of pairs of loci, we confirm that SpydrPick is able to detect, using the MI score, predictable patterns of alleles at the two loci. See, for example, the second section in <xref ref-type="fig" rid="F6">Figure 6</xref>, which only depicts the allele distribution of the locus 839,047 of <italic>glgB</italic> (glgB_839047) and the interacting locus 818,177 of <italic>gcvH</italic> (gcvH_818177). It can be noticed that when there is a C in the locus glgB_839047, there is an A in the locus gcvH_818177, and when there is a T in the locus glgB_839047, there is a C in the locus gcvH_818177. This predictability is quantitatively depicted by the value of <italic>MI</italic> &#x3d; 0.4201. The third section in <xref ref-type="fig" rid="F6">Figure 6</xref> exposes the allele distribution of interactions between the locus 839,053 of <italic>glgB</italic> (glgB_839053) and 27 loci of 26 genes (two loci of the gene <italic>mmpL3</italic> interact with the locus glgB_839053). In this section, we observe gaps (-) in the allele distribution of the interacting locus 5,762,846 of <italic>mprB</italic> (two-component histidine-protein kinase/phosphatase MprB, <italic>MI</italic> &#x3d; 0.4743), locus 5,711,087 of <italic>mmpL5</italic> (transmembrane transport protein MmpL5, <italic>MI</italic> &#x3d; 0.4670), and locus 5,715,652 of <italic>mmpL8</italic> (integral membrane transport protein MmpL8, <italic>MI</italic> &#x3d; 0.4435).</p>
<p>In <xref ref-type="fig" rid="F7">Figure 7</xref>, we present the allele distribution of loci interacting with loci 5,934,914 and 5,936,231 of the gene <italic>oppA</italic>. The first section contains the interactions with the locus oppA_5934914. We notice the presence of gaps in the positions ctpV_375337 (<italic>MI</italic> &#x3d; 0.4516) and eccB3_562698 (<italic>MI</italic> &#x3d; 0.417). <xref ref-type="fig" rid="F7">Figure 7</xref> also presents well-defined patterns of allele distribution between interacting loci.</p>
<p>The first column in both figures indicates the submitter institution (we included institutions with fewer than six submitted strains in the category &#x201c;other&#x201d;), and the second column points to genotypic antibiotic resistance (GAR) predicted with RGI. Estimated phylogeny is included on the left to show the diversity of the strain collection that we analyzed. For example, a clade at the bottom of the tree stands out due to its change of nucleotide in relation to the rest of the strains.</p>
<p>The application of this methodology also allowed the identification within the network of various loci in genes associated with resistance. Recently, the WHO published the first catalog of resistance-associated genetic variants for predicting relevant resistance phenotypes based on more than 38,000 WGS phenotyped isolates (<xref ref-type="bibr" rid="B46">WHO, 2021</xref>). This has allowed the identification of multiple positions associated with resistance and their classification into five groups. We use this recent classification to find antibiotic-resistant genes in the epistatic network (<xref ref-type="table" rid="T2">Table 2</xref>).</p>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>Antibiotic-resistance genes reported in the WHO catalogue that were found in the epistatic network.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Gene</th>
<th align="center">Antibiotic-resistant gene (drug)</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">
<italic>glgB</italic> and <italic>oppA</italic>
</td>
<td align="left">
<italic>fprA</italic> (AMI)</td>
</tr>
<tr>
<td align="left">
<italic>glgB</italic> and <italic>oppA</italic>
</td>
<td align="left">
<italic>fprA</italic> (CAP)</td>
</tr>
<tr>
<td align="left">
<italic>glgB</italic> and <italic>oppA</italic>
</td>
<td align="left">
<italic>embC</italic> (EMB)</td>
</tr>
<tr>
<td align="left">
<italic>glgB</italic>
</td>
<td align="left">
<italic>katG</italic> (INH)</td>
</tr>
<tr>
<td align="left">
<italic>glgB</italic>
</td>
<td align="left">
<italic>fgd1</italic> (DLM)</td>
</tr>
<tr>
<td align="left">
<italic>glgB</italic>
</td>
<td align="left">
<italic>mmpL5</italic> (BDQ)</td>
</tr>
<tr>
<td align="left">
<italic>glgB</italic>
</td>
<td align="left">
<italic>mmpL5</italic> (CFZ)</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn id="Tfn1">
<label>a</label>
<p>AMI &#x3d; amikacin; BDQ &#x3d; bedaquiline; CAP &#x3d; capreomycin; CFZ &#x3d; clofazimine; DLM &#x3d; delamanid; EMB &#x3d; ethambutol; INH &#x3d; isoniazid (<xref ref-type="bibr" rid="B46">WHO, 2021</xref>).</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>In our network, an interaction was found between <italic>glgB</italic> and <italic>katG</italic>; mutations conferring monoresistance to isoniazid (INH) are common due to INH having been in clinical use since the 1950s. Nevertheless, INH resistance testing has only recently been included in some specialized cartridges (e.g., Xpert MTB/XDR) and is not routinely available, so that if INH resistance is not detected, patients are treated as pan-susceptible, which represents a high risk of treatment failure and a greater propensity to acquire further resistance (<xref ref-type="bibr" rid="B43">Sulis and Pai, 2020</xref>).</p>
<p>From the antibiotic-resistance genes that we found in the WHO catalog, we observed that <italic>fprA</italic> (resistant to amikacin and capreomycin) and <italic>embC</italic> (resistant to ethambutol) interact with both genes <italic>glgB</italic> and <italic>oppA</italic> (<xref ref-type="table" rid="T2">Table 2</xref>). Moreover, they interact with each other, forming a clique of four genes (<xref ref-type="fig" rid="F8">Figure 8</xref>). A clique depicts a network where all nodes are fully connected to each other, creating a strong interaction mechanism. This kind of epistatic interaction motivates us to envision future studies to test new experimental hypotheses to elucidate their biological and pharmacological explanations, and the MI score seems to be a very successful approach to do so.</p>
<fig id="F8" position="float">
<label>FIGURE 8</label>
<caption>
<p>Epistatic interactions between the antibiotic-resistant genes <italic>fprA</italic> and <italic>embC</italic>, and the putative targets of co-selection genes <italic>glgB</italic> and <italic>oppA</italic>.</p>
</caption>
<graphic xlink:href="fmolb-09-856212-g008.tif"/>
</fig>
</sec>
</sec>
</sec>
<sec id="s4">
<title>4 Conclusion</title>
<p>Here, we have presented the reconstruction and analysis of an epistatic network for Mtb from a pan&#x2013;genome-wide alignment by using the model-free method SpydrPick. Our approach allowed us to identify new epistatic interactions with implications in virulence, pathogenesis, transport system modulators of the immune response, and genotypic antibiotic resistance. By the analysis of the epistatic network, we identified <italic>glgB</italic> and <italic>oppA</italic> as putative targets of co-selection. These two genes epistatically interact with <italic>fprA</italic> and <italic>embC</italic>, two antibiotic-resistant genes reported in the catalog of the WHO, as resistant to ethambutol (<italic>embC</italic>) and amikacin and capreomycin (<italic>fprA</italic>). Our results highlight the importance of implementing computational approaches to elucidate new genes associated with putative epistatic interactions in Mtb.</p>
</sec>
</body>
<back>
<sec id="s5">
<title>Data Availability Statement</title>
<p>The original contributions presented in the study are included in the article/<xref ref-type="sec" rid="s10">Supplementary Material</xref>; further inquiries can be directed to the corresponding authors. R scripts are available at <ext-link ext-link-type="uri" xlink:href="https://github.com/biotb/epitb-net">https://github.com/biotb/epitb-net</ext-link>.</p>
</sec>
<sec id="s6">
<title>Author Contributions</title>
<p>ABPR and SFC conceptualized, designed, and conducted the investigation. ABPR analyzed the data and generated the epistatic network. YBM, SAR, PV, and SFC supervised the research. All authors wrote the manuscript. ABPR and SFC take responsibility for the manuscript. All authors read and approved the final content.</p>
</sec>
<sec id="s7">
<title>Funding</title>
<p>This research was partially supported by the Programa Interno de Apoyo para Proyectos de Investigaci&#xf3;n, FESC, UNAM (PIAPI 2018).</p>
</sec>
<sec sec-type="COI-statement" id="s8">
<title>Conflict of Interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s9">
<title>Publisher&#x2019;s Note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors, and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ack>
<p>ABPR is a doctoral student from the <italic>Programa de Doctorado en Ciencias Biol&#xf3;gicas, Universidad Nacional Aut&#xf3;noma de M&#xe9;xico</italic> (UNAM) and received a fellowship from CONACyT (631936). PV gratefully acknowledges support by CONACyT A1-S-11242 and PAPIIT-UNAM IN209321. ABPR gratefully acknowledges the <italic>Programa de Ingenier&#xed;a Gen&#xf3;mica</italic>, CCG-UNAM, for the support during her stay (February&#x2013;December 2019). We acknowledge the support of Miguel &#xc1;ngel P&#xe9;rez Le&#xf3;n of the <italic>Laboratorio de c&#xf3;mputo de alto rendimiento, Coordinaci&#xf3;n del departamento de Matem&#xe1;ticas</italic> and of the Lansbiodyt (<italic>Laboratorio Nacional de Soluciones Biomim&#xe9;ticas para Diagn&#xf3;stico y Terapia</italic>)<italic>, Facultad de Ciencias, UNAM</italic>. <xref ref-type="fig" rid="F1">Figures 1</xref>, <xref ref-type="fig" rid="F8">8</xref> were created with <ext-link ext-link-type="uri" xlink:href="http://BioRender.com">BioRender.com</ext-link>.</p>
</ack>
<sec id="s10">
<title>Supplementary Material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fmolb.2022.856212/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fmolb.2022.856212/full&#x23;supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="DataSheet7.XLSX" id="SM1" mimetype="application/XLSX" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="DataSheet4.XLSX" id="SM2" mimetype="application/XLSX" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="DataSheet6.XLSX" id="SM3" mimetype="application/XLSX" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="DataSheet3.XLSX" id="SM4" mimetype="application/XLSX" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table1.XLSX" id="SM5" mimetype="application/XLSX" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="DataSheet8.XLSX" id="SM6" mimetype="application/XLSX" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="DataSheet5.XLSX" id="SM7" mimetype="application/XLSX" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="DataSheet1.XLSX" id="SM8" mimetype="application/XLSX" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="DataSheet2.XLSX" id="SM9" mimetype="application/XLSX" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Alcock</surname>
<given-names>B. P.</given-names>
</name>
<name>
<surname>Raphenya</surname>
<given-names>A. R.</given-names>
</name>
<name>
<surname>Lau</surname>
<given-names>T. T. Y.</given-names>
</name>
<name>
<surname>Tsang</surname>
<given-names>K. K.</given-names>
</name>
<name>
<surname>Bouchard</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Edalatmand</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>CARD 2020: Antibiotic Resistome Surveillance with the Comprehensive Antibiotic Resistance Database</article-title>. <source>Nucleic Acids Res.</source> <volume>48</volume>, <fpage>D517</fpage>&#x2013;<lpage>D525</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkz935</pub-id> </citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Angala</surname>
<given-names>S. K.</given-names>
</name>
<name>
<surname>Belardinelli</surname>
<given-names>J. M.</given-names>
</name>
<name>
<surname>Huc-Claustre</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Wheat</surname>
<given-names>W. H.</given-names>
</name>
<name>
<surname>Jackson</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>The Cell Envelope Glycoconjugates of <italic>Mycobacterium tuberculosis</italic></article-title>. <source>Crit. Rev. Biochem. Mol. Biol.</source> <volume>49</volume>, <fpage>361</fpage>&#x2013;<lpage>399</lpage>. <pub-id pub-id-type="doi">10.3109/10409238.2014.925420</pub-id> </citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Black</surname>
<given-names>P. A.</given-names>
</name>
<name>
<surname>Warren</surname>
<given-names>R. M.</given-names>
</name>
<name>
<surname>Louw</surname>
<given-names>G. E.</given-names>
</name>
<name>
<surname>van Helden</surname>
<given-names>P. D.</given-names>
</name>
<name>
<surname>Victor</surname>
<given-names>T. C.</given-names>
</name>
<name>
<surname>Kana</surname>
<given-names>B. D.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Energy Metabolism and Drug Efflux in <italic>Mycobacterium tuberculosis</italic></article-title>. <source>Antimicrob. Agents Chemother.</source> <volume>58</volume>, <fpage>2491</fpage>&#x2013;<lpage>2503</lpage>. <pub-id pub-id-type="doi">10.1128/aac.02293-13</pub-id> </citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Boitel</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Ortiz-Lombard&#xed;a</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Dur&#xe1;n</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Pompeo</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Cole</surname>
<given-names>S. T.</given-names>
</name>
<name>
<surname>Cerve&#xf1;ansky</surname>
<given-names>C.</given-names>
</name>
<etal/>
</person-group> (<year>2003</year>). <article-title>PknB Kinase Activity Is Regulated by Phosphorylation in Two Thr Residues and Dephosphorylation by PstP, the Cognate Phospho-Ser/Thr Phosphatase, in <italic>Mycobacterium tuberculosis</italic></article-title>. <source>Mol. Microbiol.</source> <volume>49</volume>, <fpage>1493</fpage>&#x2013;<lpage>1508</lpage>. <pub-id pub-id-type="doi">10.1046/j.1365-2958.2003.03657.x</pub-id> </citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Borowiec</surname>
<given-names>M. L.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>AMAS: a Fast Tool for Alignment Manipulation and Computing of Summary Statistics</article-title>. <source>PeerJ</source> <volume>4</volume>, <fpage>e1660</fpage>. <pub-id pub-id-type="doi">10.7717/peerj.1660</pub-id> </citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cassio Barreto de Oliveira</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Balan</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>The ATP-Binding Cassette (ABC) Transport Systems in <italic>Mycobacterium tuberculosis</italic>: Structure, Function, and Possible Targets for Therapeutics</article-title>. <source>Biology</source> <volume>9</volume>, <fpage>443</fpage>. <pub-id pub-id-type="doi">10.3390/biology9120443</pub-id> </citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chanda</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Costa</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Hu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Sukumar</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Van Hemert</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Walia</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Information Theory in Computational Biology: Where We Stand Today</article-title>. <source>Entropy</source> <volume>22</volume>, <fpage>627</fpage>. <pub-id pub-id-type="doi">10.3390/e22060627</pub-id> </citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cole</surname>
<given-names>S. T.</given-names>
</name>
<name>
<surname>Brosch</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Parkhill</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Garnier</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Churcher</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Harris</surname>
<given-names>D.</given-names>
</name>
<etal/>
</person-group> (<year>1998</year>). <article-title>Deciphering the Biology of <italic>Mycobacterium tuberculosis</italic> from the Complete Genome Sequence</article-title>. <source>Nature</source> <volume>393</volume>, <fpage>537</fpage>&#x2013;<lpage>544</lpage>. <pub-id pub-id-type="doi">10.1038/31159</pub-id> </citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Coscolla</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Gagneux</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Consequences of Genomic Diversity in <italic>Mycobacterium tuberculosis</italic></article-title>. <source>Semin. Immunol.</source> <volume>26</volume>, <fpage>431</fpage>&#x2013;<lpage>444</lpage>. <pub-id pub-id-type="doi">10.1016/j.smim.2014.09.012</pub-id> </citation>
</ref>
<ref id="B10">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Cover</surname>
<given-names>T. M.</given-names>
</name>
<name>
<surname>Thomas</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2006</year>). <source>Elements of Information Theory</source>. <publisher-loc>New Jersey</publisher-loc>: <publisher-name>Wiley-Interscience</publisher-name>. </citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dasgupta</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Sureka</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Mitra</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Saha</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Sanyal</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Das</surname>
<given-names>A. K.</given-names>
</name>
<etal/>
</person-group> (<year>2010</year>). <article-title>An Oligopeptide Transporter of <italic>Mycobacterium tuberculosis</italic> Regulates Cytokine Release and Apoptosis of Infected Macrophages</article-title>. <source>PLoS One</source> <volume>5</volume>, <fpage>e12225</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0012225</pub-id> </citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>De Smet</surname>
<given-names>K. A. L.</given-names>
</name>
<name>
<surname>Weston</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Brown</surname>
<given-names>I. N.</given-names>
</name>
<name>
<surname>Young</surname>
<given-names>D. B.</given-names>
</name>
<name>
<surname>Robertson</surname>
<given-names>B. D.</given-names>
</name>
</person-group> (<year>2000</year>). <article-title>Three Pathways for Trehalose Biosynthesis in Mycobacteria</article-title>. <source>Microbiology</source> <volume>146</volume>, <fpage>199</fpage>&#x2013;<lpage>208</lpage>. <pub-id pub-id-type="doi">10.1099/00221287-146-1-199</pub-id> </citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dkhar</surname>
<given-names>H. K.</given-names>
</name>
<name>
<surname>Gopalsamy</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Loharch</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Kaur</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Bhutani</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Saminathan</surname>
<given-names>K.</given-names>
</name>
<etal/>
</person-group> (<year>2015</year>). <article-title>Discovery of <italic>Mycobacterium tuberculosis</italic> &#x3b1;-1,4-Glucan Branching Enzyme (GlgB) Inhibitors by Structure- and Ligand-Based Virtual Screening</article-title>. <source>J. Biol. Chem.</source> <volume>290</volume>, <fpage>76</fpage>&#x2013;<lpage>89</lpage>. <pub-id pub-id-type="doi">10.1074/jbc.m114.589200</pub-id> </citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Domenech</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Kobayashi</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>LeVier</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Walker</surname>
<given-names>G. C.</given-names>
</name>
<name>
<surname>Barry</surname>
<given-names>C. E.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>BacA, an ABC Transporter Involved in Maintenance of Chronic Murine Infections with <italic>Mycobacterium tuberculosis</italic>
</article-title>. <source>J. Bacteriol.</source> <volume>191</volume>, <fpage>477</fpage>&#x2013;<lpage>485</lpage>. <pub-id pub-id-type="doi">10.1128/JB.01132-08</pub-id> </citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Drost</surname>
<given-names>H. G.</given-names>
</name>
<name>
<surname>Paszkowski</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Biomartr: Genomic Data Retrieval with R</article-title>. <source>Bioinformatics</source> <volume>33</volume>, <fpage>1216</fpage>&#x2013;<lpage>1217</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btw821</pub-id> </citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gonzalo-Asensio</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Malaga</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Pawlik</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Astarie-Dequeker</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Passemar</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Moreau</surname>
<given-names>F.</given-names>
</name>
<etal/>
</person-group> (<year>2014</year>). <article-title>Evolutionary History of Tuberculosis Shaped by Conserved Mutations in the PhoPR Virulence Regulator</article-title>. <source>Proc. Natl. Acad. Sci. U.S.A.</source> <volume>111</volume>, <fpage>11491</fpage>&#x2013;<lpage>11496</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1406693111</pub-id> </citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Goude</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Amin</surname>
<given-names>A. G.</given-names>
</name>
<name>
<surname>Chatterjee</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Parish</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>The Critical Role of EmbC in <italic>Mycobacterium tuberculosis</italic></article-title>. <source>J. Bacteriol.</source> <volume>190</volume>, <fpage>4335</fpage>&#x2013;<lpage>4341</lpage>. <pub-id pub-id-type="doi">10.1128/jb.01825-07</pub-id> </citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gouy</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Gautier</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Attimonelli</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Lanave</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Paola</surname>
<given-names>G. d.</given-names>
</name>
</person-group> (<year>1985</year>). <article-title>ACNUC &#x2013; A Portable Retrieval System for Nucleic Acid Sequence Databases: Logical and Physical Designs and Usage</article-title>. <source>Bioinformatics</source> <volume>1</volume>, <fpage>167</fpage>&#x2013;<lpage>172</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/1.3.167</pub-id> </citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gupta</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Kumar</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Agrawal</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>New Players in Immunity to Tuberculosis: the Host Microbiome, Lung Epithelium, and Innate Immune Cells</article-title>. <source>Front. Immunol.</source> <volume>9</volume>, <fpage>709</fpage>. <pub-id pub-id-type="doi">10.3389/fimmu.2018.00709</pub-id> </citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hadfield</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Croucher</surname>
<given-names>N. J.</given-names>
</name>
<name>
<surname>Goater</surname>
<given-names>R. J.</given-names>
</name>
<name>
<surname>Abudahab</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Aanensen</surname>
<given-names>D. M.</given-names>
</name>
<name>
<surname>Harris</surname>
<given-names>S. R.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Phandango: an Interactive Viewer for Bacterial Population Genomics</article-title>. <source>Bioinformatics</source> <volume>34</volume>, <fpage>292</fpage>&#x2013;<lpage>293</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btx610</pub-id> </citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hopfe</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Dahlmanns</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Henrich</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>In <italic>Mycoplasma hominis</italic> the OppA-Mediated Cytoadhesion Depends on its ATPase Activity</article-title>. <source>BMC Microbiol.</source> <volume>11</volume>, <fpage>185</fpage>&#x2013;<lpage>189</lpage>. <pub-id pub-id-type="doi">10.1186/1471-2180-11-185</pub-id> </citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Huang</surname>
<given-names>D. W.</given-names>
</name>
<name>
<surname>Sherman</surname>
<given-names>B. T.</given-names>
</name>
<name>
<surname>Lempicki</surname>
<given-names>R. A.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Systematic and Integrative Analysis of Large Gene Lists Using DAVID Bioinformatics Resources</article-title>. <source>Nat. Protoc.</source> <volume>4</volume>, <fpage>44</fpage>&#x2013;<lpage>57</lpage>. <pub-id pub-id-type="doi">10.1038/nprot.2008.211</pub-id> </citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Iswahyudi</surname>
</name>
<name>
<surname>Mukamolova</surname>
<given-names>G. V.</given-names>
</name>
<name>
<surname>Straatman-Iwanowska</surname>
<given-names>A. A.</given-names>
</name>
<name>
<surname>Allcock</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Ajuh</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Turapov</surname>
<given-names>O.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Mycobacterial Phosphatase PstP Regulates Global Serine Threonine Phosphorylation and Cell Division</article-title>. <source>Sci. Rep.</source> <volume>9</volume>, <fpage>8337</fpage>&#x2013;<lpage>8411</lpage>. <pub-id pub-id-type="doi">10.1038/s41598-019-44841-9</pub-id> <ext-link ext-link-type="uri" xlink:href="https://www.nature.com/articles/s41598-019-44841-9#citeas">https://www.nature.com/articles/s41598-019-44841-9#citeas</ext-link>. </citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jiao</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Sherman</surname>
<given-names>B. T.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>D. W.</given-names>
</name>
<name>
<surname>Stephens</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Baseler</surname>
<given-names>M. W.</given-names>
</name>
<name>
<surname>Lane</surname>
<given-names>H. C.</given-names>
</name>
<etal/>
</person-group> (<year>2012</year>). <article-title>DAVID-WS: a Stateful Web Service to Facilitate Gene/Protein List Analysis</article-title>. <source>Bioinformatics</source> <volume>28</volume>, <fpage>1805</fpage>&#x2013;<lpage>1806</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/bts251</pub-id> </citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kavvas</surname>
<given-names>E. S.</given-names>
</name>
<name>
<surname>Catoiu</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Mih</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Yurkovich</surname>
<given-names>J. T.</given-names>
</name>
<name>
<surname>Seif</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Dillon</surname>
<given-names>N.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Machine Learning and Structural Analysis of <italic>Mycobacterium tuberculosis</italic> Pan-Genome Identifies Genetic Signatures of Antibiotic Resistance</article-title>. <source>Nat. Commun.</source> <volume>9</volume>, <fpage>4306</fpage>&#x2013;<lpage>4309</lpage>. <pub-id pub-id-type="doi">10.1038/s41467-018-06634-y</pub-id> </citation>
</ref>
<ref id="B26">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Kohl</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Wiese</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Warscheid</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2011</year>). &#x201c;<article-title>Cytoscape: Software for Visualization and Analysis of Biological Networks</article-title>,&#x201d; in <source>Data Mining in Proteomics</source> (<publisher-name>Springer</publisher-name>), <fpage>291</fpage>&#x2013;<lpage>303</lpage>. <pub-id pub-id-type="doi">10.1007/978-1-60761-987-1_18</pub-id> </citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kozlov</surname>
<given-names>A. M.</given-names>
</name>
<name>
<surname>Darriba</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Flouri</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Morel</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Stamatakis</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>RAxML-NG: a Fast, Scalable and User-Friendly Tool for Maximum Likelihood Phylogenetic Inference</article-title>. <source>Bioinformatics</source> <volume>35</volume>, <fpage>4453</fpage>&#x2013;<lpage>4455</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btz305</pub-id> </citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lerner</surname>
<given-names>T. R.</given-names>
</name>
<name>
<surname>Borel</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Gutierrez</surname>
<given-names>M. G.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>The Innate Immune Response in Human Tuberculosis</article-title>. <source>Cell Microbiol.</source> <volume>17</volume>, <fpage>1277</fpage>&#x2013;<lpage>1285</lpage>. <pub-id pub-id-type="doi">10.1111/cmi.12480</pub-id> </citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Letunic</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Bork</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Interactive Tree of Life (iTOL) V5: an Online Tool for Phylogenetic Tree Display and Annotation</article-title>. <source>Nucleic Acids Res.</source> <volume>49</volume>, <fpage>W293</fpage>&#x2013;<lpage>W296</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkab301</pub-id> </citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Lv</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>He</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Z.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Gene Network in Pulmonary Tuberculosis Based on Bioinformatic Analysis</article-title>. <source>BMC Infect. Dis.</source> <volume>20</volume>, <fpage>612</fpage>&#x2013;<lpage>711</lpage>. <pub-id pub-id-type="doi">10.1186/s12879-020-05335-6</pub-id> </citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lu</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Lill</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Bald</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>ATP Synthase in Mycobacteria: Special Features and Implications for a Function as Drug Target</article-title>. <source>Biochim. Biophys. Acta (BBA) - Bioenerg.</source> <volume>1837</volume>, <fpage>1208</fpage>&#x2013;<lpage>1218</lpage>. <pub-id pub-id-type="doi">10.1016/j.bbabio.2014.01.022</pub-id> </citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Melly</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Purdy</surname>
<given-names>G.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>MmpL Proteins in Physiology and Pathogenesis of <italic>M. tuberculosis</italic></article-title>. <source>Microorganisms</source> <volume>7</volume>, <fpage>70</fpage>. <pub-id pub-id-type="doi">10.3390/microorganisms7030070</pub-id> </citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Page</surname>
<given-names>A. J.</given-names>
</name>
<name>
<surname>Cummins</surname>
<given-names>C. A.</given-names>
</name>
<name>
<surname>Hunt</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Wong</surname>
<given-names>V. K.</given-names>
</name>
<name>
<surname>Reuter</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Holden</surname>
<given-names>M. T. G.</given-names>
</name>
<etal/>
</person-group> (<year>2015</year>). <article-title>Roary: Rapid Large-Scale Prokaryote Pan Genome Analysis</article-title>. <source>Bioinformatics</source> <volume>31</volume>, <fpage>3691</fpage>&#x2013;<lpage>3693</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btv421</pub-id> </citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Page</surname>
<given-names>A. J.</given-names>
</name>
<name>
<surname>Taylor</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Delaney</surname>
<given-names>A. J.</given-names>
</name>
<name>
<surname>Soares</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Seemann</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Keane</surname>
<given-names>J. A.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>SNP-sites: Rapid Efficient Extraction of SNPs from Multi-FASTA Alignments</article-title>. <source>Microb. Genomics</source> <volume>2</volume>, <fpage>e000056</fpage>. <pub-id pub-id-type="doi">10.1099/mgen.0.000056</pub-id> </citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pattengale</surname>
<given-names>N. D.</given-names>
</name>
<name>
<surname>Alipour</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Bininda-Emonds</surname>
<given-names>O. R. P.</given-names>
</name>
<name>
<surname>Moret</surname>
<given-names>B. M. E.</given-names>
</name>
<name>
<surname>Stamatakis</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>How Many Bootstrap Replicates Are Necessary?</article-title> <source>J. Comput. Biol.</source> <volume>17</volume>, <fpage>337</fpage>&#x2013;<lpage>354</lpage>. <pub-id pub-id-type="doi">10.1089/cmb.2009.0179</pub-id> </citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pensar</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Puranen</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Arnold</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>MacAlasdair</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Kuronen</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Tonkin-Hill</surname>
<given-names>G.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Genome-Wide Epistasis and Co-Selection Study Using Mutual Information</article-title>. <source>Nucleic Acids Res.</source> <volume>47</volume>, <fpage>e112</fpage>. <pub-id pub-id-type="doi">10.1093/nar/gkz656</pub-id> </citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rempel</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Gati</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Nijland</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Thangaratnarajah</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Karyolaimos</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>de Gier</surname>
<given-names>J. W.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>A Mycobacterial ABC Transporter Mediates the Uptake of Hydrophilic Compounds</article-title>. <source>Nature</source> <volume>580</volume>, <fpage>409</fpage>&#x2013;<lpage>412</lpage>. <pub-id pub-id-type="doi">10.1038/s41586-020-2072-8</pub-id> </citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sackton</surname>
<given-names>T. B.</given-names>
</name>
<name>
<surname>Hartl</surname>
<given-names>D. L.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Genotypic Context and Epistasis in Individuals and Populations</article-title>. <source>Cell</source> <volume>166</volume>, <fpage>279</fpage>&#x2013;<lpage>287</lpage>. <pub-id pub-id-type="doi">10.1016/j.cell.2016.06.047</pub-id> </citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Satta</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Lipman</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Smith</surname>
<given-names>G. P.</given-names>
</name>
<name>
<surname>Arnold</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Kon</surname>
<given-names>O. M.</given-names>
</name>
<name>
<surname>McHugh</surname>
<given-names>T. D.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>
<italic>Mycobacterium tuberculosis</italic> and Whole-Genome Sequencing: How Close Are We to Unleashing its Full Potential?</article-title> <source>Clin. Microbiol. Infect.</source> <volume>24</volume>, <fpage>604</fpage>&#x2013;<lpage>609</lpage>. <pub-id pub-id-type="doi">10.1016/j.cmi.2017.10.030</pub-id> </citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Seemann</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Prokka: Rapid Prokaryotic Genome Annotation</article-title>. <source>Bioinformatics</source> <volume>30</volume>, <fpage>2068</fpage>&#x2013;<lpage>2069</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btu153</pub-id> </citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sharma</surname>
<given-names>A. K.</given-names>
</name>
<name>
<surname>Arora</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Singh</surname>
<given-names>L. K.</given-names>
</name>
<name>
<surname>Gangwal</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Sajid</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Molle</surname>
<given-names>V.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>Serine/threonine Protein Phosphatase PstP of <italic>Mycobacterium tuberculosis</italic> Is Necessary for Accurate Cell Division and Survival of Pathogen</article-title>. <source>J. Biol. Chem.</source> <volume>291</volume>, <fpage>24215</fpage>&#x2013;<lpage>24230</lpage>. <pub-id pub-id-type="doi">10.1074/jbc.m116.754531</pub-id> </citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Skwark</surname>
<given-names>M. J.</given-names>
</name>
<name>
<surname>Croucher</surname>
<given-names>N. J.</given-names>
</name>
<name>
<surname>Puranen</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Chewapreecha</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Pesonen</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>Y. Y.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>Interacting Networks of Resistance, Virulence and Core Machinery Genes Identified by Genome-wide Epistasis Analysis</article-title>. <source>PLoS Genet.</source> <volume>13</volume>, <fpage>e1006508</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pgen.1006508</pub-id> </citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sulis</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Pai</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Isoniazid-resistant Tuberculosis: A Problem We Can No Longer Ignore</article-title>. <source>PLoS Med.</source> <volume>17</volume>, <fpage>e1003023</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pmed.1003023</pub-id> </citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Trauner</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Borrell</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Reither</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Gagneux</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Evolution of Drug Resistance in Tuberculosis: Recent Progress and Implications for Diagnosis and Therapy</article-title>. <source>Drugs</source> <volume>74</volume>, <fpage>1063</fpage>&#x2013;<lpage>1072</lpage>. <pub-id pub-id-type="doi">10.1007/s40265-014-0248-y</pub-id> </citation>
</ref>
<ref id="B45">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Tukey</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>1977</year>). <source>Exploratory Data Analysis</source>. <publisher-loc>Reading, Massachusetts</publisher-loc>: <publisher-name>Addison-Wesley</publisher-name>. </citation>
</ref>
<ref id="B46">
<citation citation-type="book">
<collab>WHO</collab> (<year>2021</year>). <source>Catalogue of Mutations in <italic>Mycobacterium tuberculosis</italic> Complex and Their Association with Drug Resistance</source>. <publisher-loc>Geneva</publisher-loc>: <publisher-name>World Health Organization</publisher-name>. </citation>
</ref>
</ref-list>
</back>
</article>