<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Microbiol.</journal-id>
<journal-title>Frontiers in Microbiology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Microbiol.</abbrev-journal-title>
<issn pub-type="epub">1664-302X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fmicb.2025.1663069</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Microbiology</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Drug selection based on pan-genomics genetic features of <italic>Mycobacterium tuberculosis</italic></article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" equal-contrib="yes">
<name>
<surname>Sun</surname>
<given-names>Xiangcheng</given-names>
</name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="author-notes" rid="fn0007"><sup>&#x2020;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/1335024/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author" equal-contrib="yes">
<name>
<surname>Xu</surname>
<given-names>Panpan</given-names>
</name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="author-notes" rid="fn0007"><sup>&#x2020;</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Shi</surname>
<given-names>Yun</given-names>
</name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/898940/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Wang</surname>
<given-names>Ning</given-names>
</name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x002A;</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Li</surname>
<given-names>Yan</given-names>
</name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x002A;</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>Institute of Biopharmaceuticals, West China Hospital of Sichuan University</institution>, <addr-line>Chengdu</addr-line>, <country>China</country></aff>
<aff id="aff2"><sup>2</sup><institution>Laboratory of Liver Surgery, West China Hospital of Sichuan University</institution>, <addr-line>Chengdu</addr-line>, <country>China</country></aff>
<author-notes>
<fn fn-type="edited-by" id="fn0008">
<p>Edited by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2121978/overview">Matteo Calcagnile</ext-link>, University of Salento, Italy</p>
</fn>
<fn fn-type="edited-by" id="fn0009">
<p>Reviewed by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/756466/overview">Shima Hadifar</ext-link>, Pasteur Institute of Iran (PII), Iran</p>
<p><ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/975018/overview">Sushanta Deb</ext-link>, Washington State University, United States</p>
</fn>
<corresp id="c001">&#x002A;Correspondence: Ning Wang, <email>wangning@wchscu.cn</email>; Yan Li, <email>lliyan@hotmail.com</email></corresp>
<fn fn-type="equal" id="fn0007"><p><sup>&#x2020;</sup>These authors have contributed equally to this work</p></fn>
</author-notes>
<pub-date pub-type="epub">
<day>02</day>
<month>09</month>
<year>2025</year>
</pub-date>
<pub-date pub-type="collection">
<year>2025</year>
</pub-date>
<volume>16</volume>
<elocation-id>1663069</elocation-id>
<history>
<date date-type="received">
<day>10</day>
<month>07</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>21</day>
<month>08</month>
<year>2025</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2025 Sun, Xu, Shi, Wang and Li.</copyright-statement>
<copyright-year>2025</copyright-year>
<copyright-holder>Sun, Xu, Shi, Wang and Li</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>Tuberculosis, caused by <italic>Mycobacterium tuberculosis</italic>, is a severe and persistent global public health issue, particularly exacerbated by the emergence of multidrug-resistant and extensively drug-resistant strains. This study employed pan-genomic approaches to analyze different strains with various resistance profiles, examining the diversity of bacterial genetic evolution in relation to mutations in resistance-related genes. The findings indicate that resistance-related genes are mostly core genes (94%), with a preference for base mutations closely associated with nonsynonymous mutations at resistance sites. Interestingly, while the majority of drugs induce positive selection in target genes, the tlyA gene under the influence of amikacin (AMI) undergoes passive selection. Cluster analysis of target genes suggests consistency between SNP clusters and drug-resistant clusters, revealing a strong correlation between bacterial evolutionary branches and resistance profiles. Consequently, based on pan-genome evolutionary characteristics, we identified the drug-resistant mutation pattern (DRMP) that can serve as a molecular fingerprint and indicator for drug sensitivity, aiding in the assessment and guidance of drug selection for treating different strains and the formulation of individualized treatment plans. This research not only enhances our understanding of the mechanisms of drug resistance in <italic>M. tuberculosis</italic> but also offers new perspectives for the development of new drugs, which is crucial for global tuberculosis control.</p>
</abstract>
<kwd-group>
<kwd><italic>M</italic><italic>. tuberculosis</italic></kwd>
<kwd>drug resistance</kwd>
<kwd>genetic diversity</kwd>
<kwd>DRMP</kwd>
<kwd>therapeutic and control strategies</kwd>
</kwd-group>
<counts>
<fig-count count="6"/>
<table-count count="0"/>
<equation-count count="1"/>
<ref-count count="71"/>
<page-count count="14"/>
<word-count count="8947"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Antimicrobials, Resistance and Chemotherapy</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="sec1">
<label>1</label>
<title>Introduction</title>
<p>Tuberculosis (TB), a historically pervasive and enduring infectious disease, continues to pose a formidable challenge to global public health (<xref ref-type="bibr" rid="ref14">Dheda et al., 2014</xref>; <xref ref-type="bibr" rid="ref57">Shaku and Bishai, 2022</xref>; <xref ref-type="bibr" rid="ref22">Farhat et al., 2024</xref>; <xref ref-type="bibr" rid="ref60">Shu and Liu, 2024</xref>), remaining one of the leading causes of mortality worldwide. Despite the continuous optimization of TB prevention and control strategies over the past few decades, the emergence of drug-resistant <italic>M. tuberculosis</italic> has significantly undermined these efforts (<xref ref-type="bibr" rid="ref18">Ehrt et al., 2018</xref>; <xref ref-type="bibr" rid="ref36">Koch and Mizrahi, 2018</xref>; <xref ref-type="bibr" rid="ref22">Farhat et al., 2024</xref>; <xref ref-type="bibr" rid="ref60">Shu and Liu, 2024</xref>). The appearance of multidrug-resistant (MDR) and extensively drug-resistant (XDR) strains (<xref ref-type="bibr" rid="ref68">Wulandari et al., 2024</xref>) has particularly limited treatment options, prolonged treatment durations, increased costs, and substantially diminished treatment efficacy (<xref ref-type="bibr" rid="ref25">Gandhi et al., 2010</xref>; <xref ref-type="bibr" rid="ref61">Singh et al., 2020</xref>; <xref ref-type="bibr" rid="ref59">Shitikov and Bespiatykh, 2023</xref>).</p>
<p>The rapid advancement of molecular biology technologies, especially the widespread application of high-throughput sequencing techniques, has markedly enhanced our understanding of the drug resistance mechanisms in <italic>M. tuberculosis</italic> (<xref ref-type="bibr" rid="ref28">Hanif and Arora, 2022</xref>). Researchers have identified various gene mutations associated with drug resistance in <italic>M. tuberculosis</italic>. These mutations involve genes critical for the clinical treatment of TB, such as: mutations in the embB and embC genes associated with ethambutol (EMB) resistance (<xref ref-type="bibr" rid="ref62">Sreevatsan et al., 1997</xref>; <xref ref-type="bibr" rid="ref55">Ramaswamy et al., 2000</xref>; <xref ref-type="bibr" rid="ref40">Lee et al., 2004</xref>; <xref ref-type="bibr" rid="ref64">Srivastava et al., 2006</xref>; <xref ref-type="bibr" rid="ref63">Srivastava et al., 2009</xref>); specific mutations in the inhA and katG genes related to isoniazid (INH) and ethionamide (ETH) resistance (<xref ref-type="bibr" rid="ref39">Lee et al., 2000</xref>; <xref ref-type="bibr" rid="ref47">Morlock et al., 2003</xref>; <xref ref-type="bibr" rid="ref38">Lavender et al., 2005</xref>; <xref ref-type="bibr" rid="ref56">Sekiguchi et al., 2007</xref>); mutations within the ethA and inhA structural genes also linked to ETH resistance (<xref ref-type="bibr" rid="ref38">Lavender et al., 2005</xref>); and high double-point mutations in the gyrA gene indicating the emergence of fluoroquinolone resistance (<xref ref-type="bibr" rid="ref4">Aubry et al., 2006</xref>; <xref ref-type="bibr" rid="ref58">Shi et al., 2006</xref>), among others. The researchers have found that the genetic diversity of <italic>M. tuberculosis</italic> is crucial for its evolutionary selection under drug pressure, understanding these genetic evolutionary patterns is significantly meaningful for preventing drug resistance and guiding medication selection (<xref ref-type="bibr" rid="ref48">M&#x00FC;ller et al., 2013</xref>; <xref ref-type="bibr" rid="ref19">Eldholm et al., 2014</xref>; <xref ref-type="bibr" rid="ref12">Cohen et al., 2015</xref>; <xref ref-type="bibr" rid="ref24">Gagneux, 2018</xref>). However, despite some progress in previous research, a systematic understanding of how <italic>M. tuberculosis</italic> evolves under different pressures is still lacking.</p>
<p>Therefore, this study employed pan-genomic analysis techniques on strains from different sources and with varying drug resistance profiles to comprehensively explore the genetic diversity of <italic>M. tuberculosis</italic> and its association with drug resistance. By examining the evolutionary trajectory of drug-resistant related genes, we aim to uncover how these genetic variations impact the drug resistance of strains. This research not only aids in deepening our comprehension of the drug resistance mechanisms in <italic>M. tuberculosis</italic>, but also showcases patterns of drug-related mutations, offering a scientific basis for prevention and control strategies and facilitating the implementation of precision treatment.</p>
</sec>
<sec sec-type="materials|methods" id="sec2">
<label>2</label>
<title>Materials and methods</title>
<sec id="sec3">
<label>2.1</label>
<title>Data collection and processing</title>
<p>We obtained a diverse collection of genomic data from two sources within the NCBI database, which cover the last two decades from August 2004 to May 2024. Firstly, we acquired raw sequencing reads from 669 sequenced <italic>M. tuberculosis</italic> isolates available through the NCBI Sequence Read Archive (SRA).<xref ref-type="fn" rid="fn0001"><sup>1</sup></xref> These data provided a broad representation of the genetic diversity present in <italic>M. tuberculosis</italic> strains worldwide. Additionally, we included an extra 470 fully assembled <italic>M. tuberculosis</italic> isolates from the NCBI Assembly database<xref ref-type="fn" rid="fn0002"><sup>2</sup></xref> to enrich our analysis with fully annotated genomic sequences (<xref rid="SM1" ref-type="supplementary-material">Supplementary Table S1</xref>). Sequencing reads were quality-trimmed with Trimmomatic v0.39 (<xref ref-type="bibr" rid="ref6">Bolger et al., 2014</xref>) to remove adapters and low-quality bases. High-quality reads were aligned to the <italic>M. tuberculosis</italic> H37Rv reference genome (NCBI: NC_000962.3) using BWA-MEM v0.7.18 (<xref ref-type="bibr" rid="ref33">Jung and Han, 2022</xref>) with default parameters. Resulting alignments (SAM format) were converted to sorted BAM files using SAMtools v1.19.2 (<xref ref-type="bibr" rid="ref13">Danecek et al., 2021</xref>) and subsequently transformed into FASTQ format using BEDTools v2.31.1 (bamtofastq) (<xref ref-type="bibr" rid="ref54">Quinlan and Hall, 2010</xref>) with default settings. <italic>De novo</italic> genome assembly was performed on processed reads using SOAPdenovo2 v2.41 (<xref ref-type="bibr" rid="ref44">Luo et al., 2012</xref>) with optimized parameters -K 127 -p 16 -F -R -u (asm_flags&#x202F;=&#x202F;3, rank&#x202F;=&#x202F;1; other parameters default). Scaffolding leveraged paired-end read information, and internal gaps were closed using GapCloser v1.12 (<xref ref-type="bibr" rid="ref44">Luo et al., 2012</xref>) with parameters -l 150 -p 30 -t 16. Assembly completeness was assessed with BUSCO v5.4.5 (<xref ref-type="bibr" rid="ref45">Manni et al., 2021</xref>) using the bacteria_odb10 lineage dataset<xref ref-type="fn" rid="fn0003"><sup>3</sup></xref> in genome mode with parameters -m geno -c 16 --long.</p>
</sec>
<sec id="sec4">
<label>2.2</label>
<title>Gene annotation</title>
<p>Reference protein-coding sequences (CDSs) from <italic>M. tuberculosis</italic> H37Rv (NCBI: NC_000962.3) were extracted from GenBank annotations, converted to nucleotide FASTA format with retention of original locus tags and functional descriptions, and compiled into a custom BLAST database using makeblastdb v2.14.0 (<xref ref-type="bibr" rid="ref8">Camacho et al., 2009</xref>). This database was filtered to exclude pseudogenes and CDSs &#x003C;100&#x202F;bp. Orthologous genes were identified via BLASTn (<xref ref-type="bibr" rid="ref8">Camacho et al., 2009</xref>) alignment against the target genome assembly under stringent parameters: <italic>E</italic>-value &#x2264;1&#x202F;&#x00D7;&#x202F;10<sup>&#x2212;5</sup>, minimum nucleotide identity 70%, and query/subject coverage &#x2265;80% (-<italic>E</italic>-value 1&#x202F;&#x00D7;&#x202F;10<sup>&#x2212;5</sup> -perc_identity 70 -qcov_hsp_perc 80). Matches fulfilling all criteria inherited H37Rv-derived locus tags and functional annotations.</p>
</sec>
<sec id="sec5">
<label>2.3</label>
<title>Pan-genome analysis</title>
<p>Pan-genome analysis was performed using IPGA (integrated prokaryotes genome and pan-genome analysis) (<xref ref-type="bibr" rid="ref43">Liu et al., 2022</xref>), a robust tool for prokaryotic genome and pan-genome analysis. Input genome files underwent automatic quality control, retaining genomes with &#x003E;90% completeness and &#x003C;5% contamination for downstream analysis. Genes were predicted in quality-controlled genomes using IPGA, and the resulting predictions served as input for the pan-genome analysis module. Within this module, the integrated software packages PanOCT (<xref ref-type="bibr" rid="ref30">Inman et al., 2019</xref>), OrthoMCL (<xref ref-type="bibr" rid="ref42">Li et al., 2003</xref>), Roary (<xref ref-type="bibr" rid="ref50">Page et al., 2015</xref>), panX (<xref ref-type="bibr" rid="ref15">Ding et al., 2017</xref>), OrthoFinder (<xref ref-type="bibr" rid="ref20">Emms and Kelly, 2015</xref>), Panaroo (<xref ref-type="bibr" rid="ref65">Tonkin-Hill et al., 2020</xref>), and PPanGGoLiN (<xref ref-type="bibr" rid="ref26">Gautreau et al., 2020</xref>) were employed with the following parameters: Identity&#x202F;=&#x202F;70, Ratio (core)&#x202F;=&#x202F;0.95, Support&#x202F;=&#x202F;&#x2212;1. Pan-genome profiles generated by the different tools were subsequently processed by the optimal selection module to identify the highest-quality pan-genome profile. To systematically characterize the potential for horizontal gene transfer within our assembled genomes, we identified and annotated mobile genetic elements (MGEs) using the mobileOG-db module (<xref ref-type="bibr" rid="ref7">Brown et al., 2022</xref>) integrated within the Proksee v1.1.3 platform (<xref ref-type="bibr" rid="ref27">Grant et al., 2023</xref>). This approach leveraged the curated mobileOG database, a comprehensive resource specifically designed for MGE annotation and encompassing protein families associated with plasmids, bacteriophages, and integrative elements (including functions such as conjugation, transposition, replication, and integration/excision). Assembled genomic sequences (FASTA format) were analyzed within Proksee, where the module employed HMMER3 (hmmscan) (<xref ref-type="bibr" rid="ref23">Finn et al., 2011</xref>) to query predicted protein sequences against the database&#x2019;s profile hidden Markov models (HMMs). Significant hits were filtered using default thresholds (<italic>E</italic>-value &#x2264; 1&#x202F;&#x00D7;&#x202F;10<sup>&#x2212;5</sup>, alignment coverage) to assign functional annotations and categorize MGE-associated genes. Putative MGEs were inferred based on the co-localization and clustering of multiple annotated genes encoding related functions. Finally, customizable circular genome plots were generated using Proksee integrated visualization capabilities to depict the genomic context, location, and distribution of identified MGE-associated genes relative to other features, exporting these as high-resolution vector graphics (SVG) for publication.</p>
</sec>
<sec id="sec6">
<label>2.4</label>
<title>SNP identification and analysis</title>
<p>Single nucleotide polymorphism (SNP) identification was performed using an integrated pipeline with BCFtools v1.15.1 (<xref ref-type="bibr" rid="ref13">Danecek et al., 2021</xref>) and GATK v4.2.6.1 (<xref ref-type="bibr" rid="ref66">Van der Auwera et al., 2013</xref>) for variant calling, followed by error correction and lineage-specific variant annotation using TB-gen v0.6.1.<xref ref-type="fn" rid="fn0004"><sup>4</sup></xref> Genetic clusters were defined by grouping isolates exhibiting a pairwise SNP distance &#x2264;12, calculated from whole-genome SNP matrices generated with Parsnp v2.0.5 (<xref ref-type="bibr" rid="ref35">Kille et al., 2024</xref>). For each cluster, the mutation rate was calculated as the average number of SNPs per site per isolate, derived from high-quality SNP calls (QUAL &#x003E; 30, DP &#x003E; 10, GQ &#x003E; 20) within all isolates of the cluster. This rate was computed by dividing the total number of identified SNPs by the product of the number of isolates in the cluster and the core genome length (4.1&#x202F;Mb). To identify cluster-specific SNP loci, a merged multi-sample VCF file (generated using BCFtools merge) containing variants from all clusters served as input. Cluster-specific loci were defined as genomic positions harboring variants present exclusively in one cluster and absent in all others. Variants private to each cluster were isolated using BCFtools isec and subsequently validated against the TB-gen database to exclude known lineage-defining markers, ensuring the identified uniqueness was specific to the cluster context.</p>
</sec>
<sec id="sec7">
<label>2.5</label>
<title>Predicted drug resistance</title>
<p>First, we used the TB-AMRpred pipeline<xref ref-type="fn" rid="fn0005"><sup>5</sup></xref> (<xref ref-type="bibr" rid="ref51">Pal and Mohanty, 2025</xref>) to predict antimicrobial drug resistance in <italic>M. tuberculosis</italic> based on whole genome sequences. Then, we combined this with the tbAnnotator pipeline<xref ref-type="fn" rid="fn0006"><sup>6</sup></xref> for analysis. By running the tbAnnotator.py script, we queried a database constructed from literature-based drug susceptibility experimental data and scored new SNPs, generating text in json format. To more intuitively display the predicted drug resistance results, we further regenerated HTML reports using the htmlReportRegenerator.py script.</p>
</sec>
<sec id="sec8">
<label>2.6</label>
<title>Whole-genome phylogenetic reconstruction</title>
<p>Whole-genome phylogenies were inferred using RealPhy v1.13 (<xref ref-type="bibr" rid="ref5">Bertels et al., 2014</xref>) (parameters: -minlen 50, -minqual 20) from high-quality genome assemblies (FASTA format; assessed with CheckM v1.2.3 (<xref ref-type="bibr" rid="ref52">Parks et al., 2015</xref>): completeness &#x003E;95%, contamination &#x003C;5%). This reference-guided approach generated a multiple sequence alignment incorporating SNPs identified <italic>de novo</italic> and via reference mapping. Gap-rich sites (&#x003E;90% gaps) were removed using trimAl v1.5.0 (-gt 0.1) (<xref ref-type="bibr" rid="ref10">Capella-Guti&#x00E9;rrez et al., 2009</xref>). Maximum-likelihood phylogenetic reconstruction was performed with IQ-TREE v2.3.4 (<xref ref-type="bibr" rid="ref46">Minh et al., 2020</xref>), employing the ModelFinder-Plus algorithm (-m MFP&#x202F;+&#x202F;ASC) (<xref ref-type="bibr" rid="ref34">Kalyaanamoorthy et al., 2017</xref>) to select the optimal substitution model while accounting for ascertainment bias (ASC). Branch support was assessed using 1,000 ultrafast bootstrap replicates (UFBoot; -B 1000 --bnni) and the Shimodaira-Hasegawa approximate likelihood ratio test (SH-aLRT; -alrt 1,000); clades with UFBoot &#x2265;95% and SH-aLRT &#x2265;80% were considered well-supported. The entire workflow was replicated three times to confirm topological consistency. Final tree visualization and annotation utilized iTOL v6 (accessible at <ext-link xlink:href="https://itol.embl.de/" ext-link-type="uri">https://itol.embl.de/</ext-link>) (<xref ref-type="bibr" rid="ref41">Letunic and Bork, 2021</xref>).</p>
</sec>
<sec id="sec9">
<label>2.7</label>
<title>Amino acid mutation frequency quantification</title>
<p>Amino acid mutation frequencies were determined by calculating the percentage of alterations observed at mutated positions in analyzed resistance gene sites. A &#x201C;gain&#x201D; event denotes the introduction of a specific amino acid at a position where it was previously absent, while a &#x201C;loss&#x201D; event indicates the replacement of a specific amino acid originally present at that position. The gain frequency (Freq<sub>gain</sub>) and loss frequency (Freq<sub>loss</sub>) for each amino acid were calculated as:</p>
<disp-formula id="E1">
<mml:math id="M1">
<mml:msub>
<mml:mtext>Freq</mml:mtext>
<mml:mrow>
<mml:mtext>gain</mml:mtext>
<mml:mo>/</mml:mo>
<mml:mtext>loss</mml:mtext>
</mml:mrow>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mo>&#x2211;</mml:mo>
<mml:msub>
<mml:mtext>Count</mml:mtext>
<mml:mrow>
<mml:mtext>gain</mml:mtext>
<mml:mo>/</mml:mo>
<mml:mtext>loss</mml:mtext>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2211;</mml:mo>
<mml:msub>
<mml:mtext>Total</mml:mtext>
<mml:mtext>mutated</mml:mtext>
</mml:msub>
</mml:mrow>
</mml:mfrac>
</mml:math>
</disp-formula>
<p>where: <inline-formula>
<mml:math id="M2">
<mml:mo>&#x2211;</mml:mo>
<mml:msub>
<mml:mtext>Count</mml:mtext>
<mml:mrow>
<mml:mtext>gain</mml:mtext>
<mml:mo>/</mml:mo>
<mml:mtext>loss</mml:mtext>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula> =&#x202F;Total number of gain/loss events across all sequences, <inline-formula>
<mml:math id="M3">
<mml:mo>&#x2211;</mml:mo>
<mml:msub>
<mml:mtext>Total</mml:mtext>
<mml:mtext>mutated</mml:mtext>
</mml:msub>
</mml:math>
</inline-formula> =&#x202F;Total number of mutated amino acid positions in all sequences. This metric reflects the proportion of gain or loss events per amino acid relative to all observed mutations.</p>
</sec>
<sec id="sec10">
<label>2.8</label>
<title>Evolutionary selection pressure on drug resistance-associated genes</title>
<p>To assess the selection pressure acting on these protein-coding genes, we extracted the precise genomic coordinates of the target resistance genes (the 31 genes identified through resistance analysis) from species-specific annotation files using an awk script, generating corresponding BED-format files. Nucleotide coding sequences (CDS) were then batch-extracted from the assembled genomes based on these coordinates using bedtools getfasta -s -name+. These CDS sequences were subsequently translated into amino acid sequences in batch using a custom Python script employing the Biopython library. Finally, the ratios of non-synonymous (<italic>K</italic><sub>a</sub>) to synonymous (<italic>K</italic><sub>s</sub>) substitution rates (<italic>K</italic><sub>a</sub>/<italic>K</italic><sub>s</sub>) were calculated batch-wise using the ParaAT pipeline (<xref ref-type="bibr" rid="ref71">Zhang et al., 2012</xref>), where sequence alignment was performed by MAFFT v7.526 using default parameters, and <italic>K</italic><sub>a</sub> and <italic>K</italic><sub>s</sub> values were computed by <italic>K</italic><sub>a</sub><italic>K</italic><sub>s</sub>_Calculator v3.0 (<xref ref-type="bibr" rid="ref69">Zhang, 2022</xref>) using default parameters. <italic>K</italic><sub>a</sub>/<italic>K</italic><sub>s</sub> ratios were interpreted as follows: <italic>K</italic><sub>a</sub>/<italic>K</italic><sub>s</sub>&#x202F;&#x003E;&#x202F;1 indicates positive selection (favoring fixation of amino acid-altering mutations); <italic>K</italic><sub>a</sub>/<italic>K</italic><sub>s</sub>&#x202F;=&#x202F;1 indicates neutral evolution (random fixation of mutations); <italic>K</italic><sub>a</sub>/<italic>K</italic><sub>s</sub>&#x202F;&#x003C;&#x202F;1 indicates purifying selection (removal of amino acid-altering mutations). We visualized the results by plotting <italic>K</italic><sub>a</sub>/<italic>K</italic><sub>s</sub> density plots using ggplot2 v3.5.1 in R v4.2.1.</p>
</sec>
<sec id="sec11">
<label>2.9</label>
<title>Cluster analysis</title>
<p>Based on the resistance stratification data, we utilized unsupervised clustering analysis to categorize a collection of 600 strains. To determine the stable number of clusters, we employed the ConsensusClusterPlus22 R package, performing clustering analyses across all groups through 1,000 iterations using the KM hierarchical clustering algorithm. Additionally, we utilized PCA (principal component analysis) to further validate the stability of the classifications. Subsequently, we used the VCF2PCACluster (<xref ref-type="bibr" rid="ref29">He et al., 2024</xref>) to perform PCA and clustering analysis on the SNP (single nucleotide polymorphism) data.</p>
</sec>
<sec id="sec12">
<label>2.10</label>
<title>Muti-gene phylogeny</title>
<p>Coding sequences (CDSs) of 31 resistance genes were individually aligned using MAFFT v7.505 with the --auto parameter in PhyloSuite v1.2.3 (<xref ref-type="bibr" rid="ref70">Zhang et al., 2020</xref>). Poorly aligned regions were trimmed using trimAl v1.4 with the -automated1 heuristic to preserve reliable phylogenetic signal. The trimmed alignments were then concatenated into a super matrix using PhyloSuite&#x2019;s integrated concatenation tool. Optimal partitioning schemes (by gene and codon position) and nucleotide substitution models were determined under the Bayesian information criterion (BIC) using PartitionFinder v2.1.1 (<xref ref-type="bibr" rid="ref37">Lanfear et al., 2017</xref>), employing a greedy search algorithm to evaluate model combinations. Maximum likelihood (ML) phylogenies were reconstructed with IQ-TREE v2.3.4, applying partition-specific substitution models. Topological robustness was assessed via 10,000 ultrafast bootstrap (UFBoot) replicates and by evaluating 100 distinct random starting trees to ensure consistency. Final trees were visualized and annotated in iTOL v6.</p>
</sec>
<sec id="sec13">
<label>2.11</label>
<title>Differential analysis of SNPs</title>
<p>We constructed a matrix of SNPs and refined it meticulously to ensure data accuracy and consistency. During the matrix establishment, we set a criterion: if a mutation occurred at a particular locus within the sample, that locus was labeled as 1; if no mutation occurred, it was labeled as 0. Subsequently, we conducted a comprehensive comparative analysis across different cluster types to identify which SNPs had a mutation rate exceeding 90% in each cluster type and further filtered out SNP loci unique to each category. These filtered loci are referred to as drug-resistant mutation pattern (DRMP).</p>
</sec>
<sec id="sec14">
<label>2.12</label>
<title>Statistical analysis</title>
<p>For statistical analysis and graphical generation, we utilized R Project v4.0.2 (accessible at <ext-link xlink:href="https://www.r-project.org/" ext-link-type="uri">https://www.r-project.org/</ext-link>). In terms of text processing, we employed Perl v5.15 (available at <ext-link xlink:href="https://www.perl.org/" ext-link-type="uri">https://www.perl.org/</ext-link>) and Python v3.10 (accessible at <ext-link xlink:href="https://www.python.org/" ext-link-type="uri">https://www.python.org/</ext-link>). To calculate the correlation between gene mutation bases and amino acid usage and evolutionary rates, we applied the Spearman&#x2019;s rank correlation analysis method. For drawing and beautifying the evolutionary tree, we used iTOL v6 (accessible at <ext-link xlink:href="https://itol.embl.de/" ext-link-type="uri">https://itol.embl.de/</ext-link>) (<xref ref-type="bibr" rid="ref41">Letunic and Bork, 2021</xref>).</p>
</sec>
</sec>
<sec sec-type="results" id="sec15">
<label>3</label>
<title>Results</title>
<sec id="sec16">
<label>3.1</label>
<title>Landscape on the <italic>Mycobacterium tuberculosis</italic> pan-genome</title>
<p>We constructed a comprehensive pan-genome of <italic>M. tuberculosis</italic> by assembling 1,000 complete genomes of this pathogen. Using the IPGA scoring system, we identified that panX exhibited the most optimal performance in the pan-genome analysis of <italic>M. tuberculosis</italic>. The results revealed a striking imbalance in gene distribution: core genes constituted the overwhelming majority (69%) of the total gene complement, while accessory genes accounted for only 31%. This underscores the substantial core genome shared among the analyzed strains (<xref ref-type="fig" rid="fig1">Figure 1A</xref>). Additionally, the number of pan-gene clusters increased to 12,295, whereas the number of core gene clusters decreased to 2,935. Meanwhile, the curve began to plateau with additional strains, indicating that further strain addition had a minimal impact on defining the core genome (<xref ref-type="fig" rid="fig1">Figure 1B</xref>). Upon further statistical analysis of the gene sequence length distribution within the pan-genome, we observed a decrease in the number of genes as the gene length increased. Most genes were found to be under 2,000&#x202F;bp in length. Notably, core genes primarily consisted of shorter sequences (under 1,000&#x202F;bp), resulting in a smoother curve. In contrast, accessory genes were more prevalent among longer sequences (1,500&#x202F;bp), leading to a more fluctuating curve (<xref ref-type="fig" rid="fig1">Figure 1C</xref>). Based on the phylogenetic inference using whole-genome SNPs, we were able to classify these genomes into 16 distinct clusters (<xref ref-type="fig" rid="fig1">Figure 1D</xref>). Furthermore, our analysis of mobile genetic elements involved in constructing the pan-genome revealed that integration/excision (IE) was the most frequently annotated, with 23 occurrences. This was followed by replication/recombination/repair (RRR) (20), phage (P) (9), and stability/transfer/defense (STD) (3), transfer (T) being the least frequent of 2 (<xref ref-type="fig" rid="fig1">Figure 1E</xref>). Overall, we successfully constructed the pan-genome of <italic>M. tuberculosis</italic>, providing valuable insights into its genetic diversity and evolutionary history. This achievement highlights the power of pan-genome analysis in elucidating the complex genomic landscape of infectious diseases.</p>
<fig position="float" id="fig1">
<label>Figure 1</label>
<caption>
<p>Pan-genome mapping of <italic>M. tuberculosis</italic>. Proportion of core and accessory genes among <italic>M. tuberculosis</italic> <bold>(A)</bold>, plot of changes in the number of pan- and core gene clusters with the addition of <italic>M. tuberculosis</italic> <bold>(B)</bold>. Distribution of gene sequence lengths in the <italic>M. tuberculosis</italic> pan-genome, x-axis: gene sequence length (bp), y-axis: number of genes <bold>(C)</bold>. Phylogenetic relationships among <italic>M. tuberculosis</italic> strains based on whole-genome variation <bold>(D)</bold>. Spatial distribution of mobile genetic elements in the <italic>M. tuberculosis</italic> pan-genome <bold>(E)</bold>. IE, integration/excision, RRR, replication/recombination/repair; P, phage; STD, stability/transfer/defense; T, transfer.</p>
</caption>
<graphic xlink:href="fmicb-16-1663069-g001.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">A series of five panels showing genomic data: A) A pie chart with 69% core genes and 31% accessory genes. B) A line graph showing the number of gene clusters across genomes, with core and pan genes distinguished. C) A graph of gene count by gene length, with insets for core and accessory genes. D) A circular phylogenetic tree with SNPs and variant depths. E) A circular diagram with gene locations and features marked.Each panel illustrates different aspects of genomic analysis.</alt-text>
</graphic>
</fig>
</sec>
<sec id="sec17">
<label>3.2</label>
<title>Pan-genomic variation in <italic>Mycobacterium tuberculosis</italic></title>
<p>To thoroughly investigate the <italic>variation</italic> of <italic>M. tuberculosis</italic>, we conducted an extensive analysis of the distribution of SNPs across the entire genome. Our findings indicate a lack of pronounced mutation hotspots; however, they suggest that genetic diversity arises ubiquitously throughout the genome rather than being concentrated in specific genomic segments (<xref ref-type="fig" rid="fig2">Figure 2A</xref>), upon statistical analysis of all base mutations, it became evident that <italic>M. tuberculosis</italic> exhibits a striking level of conservatism at the nucleotide level, with 98.08% stability observed. Only a minuscule fraction, 2.02% of bases, were found to be mutated. This high degree of genetic stability suggests that most regions of the <italic>M. tuberculosis</italic> genome are under strong selective pressure to maintain function. Among the identified mutations, the transition from cytosine (C) to guanine (G) was the most prevalent, accounting for 25.96% of all mutations. This was followed closely by the transition of guanine (G) to adenine (A), which constituted 24.47% of mutations. In contrast, transversions between adenine (A) and thymine (T) were exceedingly rare, with A to T mutations occurring at a frequency of 0.87% and T to A mutations at 0.88%. This pronounced asymmetry in substitution types highlights a fundamental constraint or bias in the mutagenic processes shaping <italic>M. tuberculosis</italic> evolution (<xref ref-type="fig" rid="fig2">Figure 2B</xref>). To investigate sequence preferences influencing mutagenesis, we generated position-weighted sequence logos centered on each nucleotide (A, C, G, T) with 5-bp flanking contexts. Motif analysis consistently revealed significant enrichment of C/G bases immediately adjacent to mutated sites across all central nucleotides (<italic>p</italic>&#x202F;&#x003C;&#x202F;0.001, Fisher&#x2019;s exact test). This conserved pattern suggests that C/G dinucleotides may facilitate mutagenesis by stabilizing local structural dynamics or recruiting specific protein interactors (<xref ref-type="fig" rid="fig2">Figure 2C</xref>). To elucidate the potential impact of these mutations on protein sequence and function, we statistically analyzed the translational changes subsequent to the mutations. We counted the number of amino acid changes encoded by the mutated sites and discovered that synonymous (63%) and nonsynonymous mutations (37%) occurred in similar proportions in both the positive and negative strands. Within synonymous mutations, the amino acid alanine (Ala) was most frequently unaffected. In the realm of nonsynonymous mutations, valine (Val) was the amino acid most commonly subjected to change. Notably, tryptophan (Trp) exhibited only nonsynonymous mutations, suggesting its critical role in protein structure or function. Additionally, we observed an increase in the number of termination codons resulting from the mutations, which could have significant implications for gene expression and pathogenicity (<xref ref-type="fig" rid="fig2">Figure 2D</xref>). These insights not only enhance our understanding of the genetic diversity and evolution of <italic>M. tuberculosis</italic> but also have important implications for developing targeted therapeutic strategies against this globally significant human pathogen.</p>
<fig position="float" id="fig2">
<label>Figure 2</label>
<caption>
<p>Panoramic analysis of variation. Distribution of SNPs and GC content at the pan-genomic level <bold>(A)</bold>. Statistical map of mutant base transitions <bold>(B)</bold>. Motif plots of sequence features for each of the five bases before and after the mutant site are depicted <bold>(C)</bold>. Chart of amino acid change results <bold>(D)</bold>.</p>
</caption>
<graphic xlink:href="fmicb-16-1663069-g002.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Panel A displays a circular plot with genomic tracks for SNPs, GC skew, and GC content. Panel B shows a circular diagram highlighting nucleotide substitution percentages between A, C, G, and T. Panel C presents a sequence logo for nucleotide variations referencing A, C, G, and T. Panel D features a radial chart displaying nonsynonymous and synonymous substitutions, showing counts of amino acids like Val, Ala, and Ser.</alt-text>
</graphic>
</fig>
</sec>
<sec id="sec18">
<label>3.3</label>
<title>Drug resistance-related genes of <italic>Mycobacterium tuberculosis</italic></title>
<p>Our comprehensive investigation into genes associated with drug resistance uncovers an intriguing distribution pattern: these genes are dispersed across both the positive and negative strands of the genome. Among them, genes like embB stand out for their capacity to resist multiple drugs. Moreover, our analysis reveals a complex interplay where multiple genes can collaboratively contribute to the resistance against a single drug (<xref ref-type="fig" rid="fig3">Figure 3A</xref>). A pan-genomic examination of these pivotal genes discloses that the majority are classified as core genes, underscoring their fundamental role in the organism&#x2019;s survival. Only two genes, ethA and fabD, were characterized as auxiliary, suggesting a more specialized function (<xref ref-type="fig" rid="fig3">Figure 3B</xref>). The mutation rate among these genes was remarkably low at 1%, with the predominant mutation being a guanine (G) transitioning to adenine (A). This specific G to A mutation was the most frequent, highlighting a potential hotspot for genetic alterations impacting drug resistance. Furthermore, we analyzed the correlation between the types of variant bases and resistance to nine different antimicrobial drugs. Our results revealed a positive correlation between the occurrence of base mutations and the resistance levels observed for these drugs. Interestingly, when evaluating the resistance conferred by different mutated bases, we found that mutations exhibiting the least resistance correlation were those associated with para-aminosalicylic acid (PAS). This implies that PAS remains relatively efficacious even against strains harboring certain mutations, potentially due to the drug&#x2019;s unique mechanism of action or the types of mutations that arise in its presence. In contrast, mutations showing a higher resistance correlation were those associated with pyrazinamide (PZA). These insights into the nuanced relationships between mutated bases and drug resistance have important implications for understanding the evolution of drug-resistant strains. They also emphasize the need for continuous surveillance of mutational patterns to predict and counteract the emergence of resistant phenotypes. Moreover, this information can guide the development of more robust therapeutic strategies that are less susceptible to existing resistance mechanisms, ultimately improving clinical outcomes in the battle against multidrug-resistant infections (<xref ref-type="fig" rid="fig3">Figure 3C</xref>). These findings underscore the diverse mechanisms by which different drugs are rendered ineffective due to genetic changes. This insight not only advances our understanding of drug resistance at the genomic level but also paves the way for more targeted and effective strategies to combat drug-resistant strains.</p>
<fig position="float" id="fig3">
<label>Figure 3</label>
<caption>
<p>Analysis of drug resistance-related genes. The circular diagram displays the distribution of drug resistance-related genes and their relationship to the nine drugs. From the outside to the inside, the diagram indicates: drug names, drug resistance-related genes, distribution of SNPs, GC content, positive strand GC content, and negative strand GC content <bold>(A)</bold>. Pie chart shows the distribution of drug resistance-associated genes across the pan-genome <bold>(B)</bold>. Trend chart of mutation base type (middle) and correlation between nine different drug resistances (right) <bold>(C)</bold>. AMI, amikacin; EMB, ethambutol; ETH, ethionamide; FLQ, fluoroquinolones; INH, isoniazid; PAS, para-aminosalicylic acid; PZA, pyrazinamide; RIF, rifampicin; SM, streptomycin.</p>
</caption>
<graphic xlink:href="fmicb-16-1663069-g003.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Diagram showing genomic and drug resistance data for Mycobacterium tuberculosis. Panel A: Circular diagram with tracks for drug resistance regions and genetic content, with labeled genes. Panel B: Pie chart illustrating core genes (29) and accessory genes (2: ethA, fabD). Panel C: Bar chart detailing frequency of nucleotide mutations and heatmap showing drug resistance associations with a color gradient legend from 0 to 1.</alt-text>
</graphic>
</fig>
</sec>
<sec id="sec19">
<label>3.4</label>
<title>The relationship between gene mutations and the rate of gene evolution</title>
<p>The dynamics of gene mutations significantly influence the evolutionary trajectory of protein sequences. These evolutionary changes typically encompass the acquisition and deletion of amino acids (AAs), which can profoundly affect protein function and structural stability. In our study, we conducted an in-depth analysis of the AA variations encoded by genes associated with drug resistance. Our study findings reveal that, among the resistance genes examined, the proportion of the AA variant is significantly higher than other types, notably, alanine (Ala), valine (Val), serine (Ser), arginine (Arg), and threonine (Thr) were high variability, suggesting a possible correlation between the frequency of these residues and the adaptive advantage conferred by resistance genes. Conversely, our analysis also identified a set of AAs that appear to be more stable in these genes. Including Trp, phenylalanine (Phe), methionine (Met), lysine (Lys), and cysteine (Cys) (<xref ref-type="fig" rid="fig4">Figure 4A</xref>). This divergence in AA usage may reflect functional constraints or selective pressures unique to the resistant phenotypes. To explore the impact of mutations on the evolutionary rate of genes, we examined the ratio of nonsynonymous (<italic>K</italic><sub>a</sub>) to synonymous (<italic>K</italic><sub>s</sub>) substitutions, a metric commonly used to infer selection pressures acting on protein-coding genes. Strikingly, we observed varied <italic>K</italic><sub>a</sub>/<italic>K</italic><sub>s</sub> ratios across different resistance genes, indicating heterogeneity in their evolutionary trajectories. Remarkably, the majority of the resistance genes exhibited signatures of positive selection, indicated by <italic>K</italic><sub>a</sub>/<italic>K</italic><sub>s</sub> ratios greater than 1. This pattern suggests that these genes are evolving under pressures that favor new variants, potentially due to environmental challenges such as exposure to antimicrobial agents. In stark contrast, only two genes, tlyA and embC, showed signs of purifying selection with <italic>K</italic><sub>a</sub>/<italic>K</italic><sub>s</sub> ratios of 0.3 and 0.26, respectively (<xref ref-type="fig" rid="fig4">Figure 4B</xref>). Purifying selection, characterized by <italic>K</italic><sub>a</sub>/<italic>K</italic><sub>s</sub> ratios less than 1, operates to remove deleterious variants from the population, implying that most mutations in these genes are likely to be harmful and thus eliminated over time. Taken together, these results provide compelling evidence that the evolution of drug resistance in bacterial populations is a complex process influenced by both the accumulation of advantageous mutations and the elimination of detrimental ones. This deeper understanding of genetic variation and its impact on evolutionary dynamics can inform strategies to mitigate the spread of antimicrobial resistance.</p>
<fig position="float" id="fig4">
<label>Figure 4</label>
<caption>
<p>Correlation between gene mutation and gene evolutionary rate. The histogram displays the changes in amino acid (AA) usage frequency of nine drug resistance-related genes caused by gene mutations. The five most frequently used AAs are marked in red on the right, while the five least frequently used AAs are indicated in light green on the left <bold>(A)</bold>. Density plot of the rate of evolution of resistance genes (<italic>K</italic><sub>a</sub>/<italic>K</italic><sub>s</sub> ratio), the lines represent the corresponding genes, with the values indicating the median. <italic>K</italic><sub>a</sub>/<italic>K</italic><sub>s</sub>&#x202F;&#x003E;&#x202F;1 indicates that the gene is under positive selection, <italic>K</italic><sub>a</sub>/<italic>K</italic><sub>s</sub>&#x202F;=&#x202F;1 suggests neutral evolution of the gene, and <italic>K</italic><sub>a</sub>/<italic>K</italic><sub>s</sub>&#x202F;&#x003C;&#x202F;1 implies that the gene is undergoing purifying selection <bold>(B)</bold>.</p>
</caption>
<graphic xlink:href="fmicb-16-1663069-g004.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Composite image with two sections: (A) A bar graph showing frequency distribution of genetic gains and losses across amino acids, with different drugs represented by color-coded bars. (B) Density plots for each drug, displaying ka/ks ratios for specific genes, labeled with gene names and values, in color-coded panels corresponding to the drugs.</alt-text>
</graphic>
</fig>
</sec>
<sec id="sec20">
<label>3.5</label>
<title>Cluster analysis of <italic>Mycobacterium tuberculosis</italic></title>
<p>To elucidate the relationship between genetic mutations and drug responses, we conducted an extensive cluster analysis involving 1,140 strains. Utilizing tolerance scores against nine antimicrobial drugs, we discerned three prominent clustering groups through a rigorous examination of internal consistency and clustering effects. This classification was further validated by PCA, which distinctly separated the strains into three coherent groups on the PCA plot (<xref ref-type="fig" rid="fig5">Figure 5A</xref>). Intriguingly, when we applied PCA to investigate the association between these drugs and SNPs, a similar pattern emerged. The SNPs were broadly clustered into three subgroups on the PCA plot, suggesting a potential correlation between genetic variations and phenotypic drug responses (<xref ref-type="fig" rid="fig5">Figure 5B</xref>). Phylogenetic reconstruction based on multiple genes recapitulated the population structure observed in principal component analysis (PCA) and further demonstrated that allele-specific drug effects were closely aligned with SNP-based clustering patterns (<xref ref-type="fig" rid="fig5">Figure 5C</xref>). We presented the drug resistance characteristics of each sample through a heatmap of drug resistance. From early evolutionary stages lacking drug resistance, through intermediate stages where diverse resistance mechanisms emerged, to late stages where resistance stabilized, significant differences in drug resistance existed across clusters. By leveraging these genetic constraints, we established drug-resistance mutation profiles (DRMPs) through the analysis of SNPs within each cluster and identification of those unique to specific clusters. Critically, these DRMPs serve as precise molecular signatures that enable the selection of optimal, cluster-specific drug regimens. This approach facilitates targeted therapy, whether using single agents or tailored drug combinations, thereby maximizing treatment efficacy for distinct <italic>M. tuberculosis</italic> populations (<xref ref-type="fig" rid="fig5">Figures 5C</xref>, <xref ref-type="fig" rid="fig6">6</xref>). These analyses underscore the intricate interplay between genetic diversity and drug response, highlighting the potential of customized treatment approaches based on the molecular fingerprints of bacterial strains.</p>
<fig position="float" id="fig5">
<label>Figure 5</label>
<caption>
<p>Clustering analysis of <italic>M. tuberculosis</italic> strains. PCA clustering of drug resistance score <bold>(A)</bold> and SNPs <bold>(B)</bold>. The cluster evolutionary tree, the outer circle is a resistance distribution map of nine drugs, and the inner layer is the evolutionary tree itself, with colors showing different cluster groups <bold>(C)</bold>.</p>
</caption>
<graphic xlink:href="fmicb-16-1663069-g005.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Scatter plots and a circular dendrogram illustrate clusters related to drug resistance and SNPs. Panel A shows clusters marked A, B, and C in green, blue, and red, respectively, based on principal components. Panel B displays SNP clusters with similar color coding. Panel C features a circular dendrogram with branches and rings denoting therapeutic drug resistance scores, ranging from no resistance in blue to maximum resistance in red, for drugs AMI, EMB, ETH, FLQ, INH, PAS, PZA, RIF, and SM.</alt-text>
</graphic>
</fig>
<fig position="float" id="fig6">
<label>Figure 6</label>
<caption>
<p>Diagram of <italic>M. tuberculosis</italic> DRMP, with evolutionary levels increasing from bottom to top. Each small circle in the diagram represents an anti-tuberculosis drug, while the drugs enclosed in boxes denote the corresponding therapeutic levels that can be applied. The variant sites in the genes shown are the DRMP. The bases include the alternate allele (Alt) and the reference allele (Ref). The numbers indicate the base positions (Pos) on the gene.</p>
</caption>
<graphic xlink:href="fmicb-16-1663069-g006.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Diagram illustrating bacterial gene mutations and their relation to drug resistance. It shows genetic sequences with mutations at specific loci, connecting to therapeutic drugs. Colored spheres represent different drugs, each labeled in a legend: AMI, EMB, ETH, FLQ, INH, PAS, PZA, RIF, SM. Paths indicate how different mutations correlate to drug resistance.</alt-text>
</graphic>
</fig>
</sec>
</sec>
<sec sec-type="discussion" id="sec21">
<label>4</label>
<title>Discussion</title>
<p>The genetic diversity exhibited by <italic>M. tuberculosis</italic> is a key driver of the emergence of clinical multidrug resistance (<xref ref-type="bibr" rid="ref32">Jia et al., 2017</xref>; <xref ref-type="bibr" rid="ref49">Napier et al., 2020</xref>; <xref ref-type="bibr" rid="ref57">Shaku and Bishai, 2022</xref>), a problem that has long confounded anti-tuberculosis treatment (<xref ref-type="bibr" rid="ref22">Farhat et al., 2024</xref>; <xref ref-type="bibr" rid="ref60">Shu and Liu, 2024</xref>). In this study, we employed pan-genomic analysis methods to comprehensively explore the relationship between the evolutionary characteristics of <italic>M. tuberculosis</italic> and its drug resistance, thereby elucidating specific patterns of drug-resistant mutations. These findings provide clearer guidance for the future development of antimicrobial drugs and clinical treatment.</p>
<p>We analyzed over 1,000 <italic>M. tuberculosis</italic> strains from various sources with diverse resistance profiles collected over the past 15&#x202F;years, examining the diversity in genetic evolution and its correlation with drug-resistant gene mutations. We identified 31 main drug-resistant genes, 94% of which are attributed to the core genes (<xref ref-type="fig" rid="fig3">Figure 3</xref>). Further analysis revealed a preference for base mutations closely associated with nonsynonymous mutations at resistance sites, reflecting the adaptive changes in bacteria under drug pressure over the years. These results not only offer new perspectives on the drug-resistant mechanisms of <italic>M. tuberculosis</italic> but also provide a crucial molecular foundation for addressing drug-resistant tuberculosis.</p>
<p>The study shows that starting from drug-sensitive strains, AMI and fluoroquinolones (FLQ) resistance emerged first, followed by cumulative mutations in INH, rifampicin (RIF), and streptomycin (SM) (<xref ref-type="fig" rid="fig5">Figure 5C</xref>), indicating more than just simple cross-resistance reported previously. The analysis of evolutionary rates of drug-resistant genes suggests that although most target genes underwent positive selection (<xref ref-type="fig" rid="fig4">Figure 4</xref>), such as PAS-targeted thyA; SM-targeted rpsL, gid; and INH-targeted multiple genes, the structural diversity of these target proteins had minimal impact on their function. This provides opportunities for drug-resistant mutations. Interestingly, the tlyA gene under AMI influence underwent passive selection, indicating its conservation and potential lethality of mutations, suggesting that drug target selection should focus on more conserved proteins to minimize resistance. Thus, developing new drugs against resistant strains targeting the tlyA gene remains promising.</p>
<p>Since conventional treatment outcomes are often poor due to variant strains of <italic>M. tuberculosis</italic> (<xref ref-type="bibr" rid="ref31">Jang and Chung, 2020</xref>; <xref ref-type="bibr" rid="ref49">Napier et al., 2020</xref>), revising clinical treatment plans and selecting drugs against drug-resistant strains require identification and evaluation of prevalent bacterial strains (<xref ref-type="bibr" rid="ref21">Escalante et al., 1998</xref>; <xref ref-type="bibr" rid="ref38">Lavender et al., 2005</xref>; <xref ref-type="bibr" rid="ref61">Singh et al., 2020</xref>). Previously, this was determined primarily through phenotypic drug susceptibility testing, which involves cumbersome liquid culture screening in microplates and has a long turnaround time. Consequently, the industry has proposed using molecular drug susceptibility to assess and select treatment methods, necessitating a deep understanding of drug-resistant mutation patterns (<xref ref-type="bibr" rid="ref16">Dom&#x00ED;nguez et al., 2023</xref>). Although recent studies have used SNP detection methods to assess the drug resistance of <italic>M. tuberculosis</italic>, these mainly focused on single-drug resistance testing (<xref ref-type="bibr" rid="ref2">Allix-B&#x00E9;guec et al., 2018</xref>; <xref ref-type="bibr" rid="ref16">Dom&#x00ED;nguez et al., 2023</xref>). For example, linear probe assays like GenoType MTBDRsl VER 2.0 and cartridge-based methods like Xpert MTB/XDR detect fluoroquinolone resistance (<xref ref-type="bibr" rid="ref9">Cao et al., 2021</xref>), and Nipro Genoscholar PZA-TB II focuses on the detection of pncA gene mutations related to PZA resistance (<xref ref-type="bibr" rid="ref17">Driesen et al., 2018</xref>; <xref ref-type="bibr" rid="ref67">Willby et al., 2018</xref>). However, these methods fall short in comprehensiveness and systematicity. Part of this is due to background noise from random genetic drift, and another part is because drug resistance often results from combined mutations across multiple genes and sites (<xref ref-type="bibr" rid="ref1">Ahmad et al., 2016</xref>; <xref ref-type="bibr" rid="ref11">Chen et al., 2023</xref>; <xref ref-type="bibr" rid="ref16">Dom&#x00ED;nguez et al., 2023</xref>). Additionally, different drug sensitivity testing (DST) methods may lead to the emergence of discrepant results among isolates (<xref ref-type="bibr" rid="ref53">Qadir et al., 2024</xref>), which increases the difficulty of fully understanding mutation patterns and evaluating unknown variant strains. Comparative studies on evolutionary patterns under polypharmacy pressure over extended periods can clarify strain characteristics, enabling a more comprehensive drug-resistant assessment of all variant strains (<xref ref-type="bibr" rid="ref3">Arnold et al., 2022</xref>). Therefore, to provide detailed data support for future molecular drug susceptibility diagnostics, our study reveals the interplay between diversity and drug pressure selection through pan-genome PCA and clustering analysis (<xref ref-type="fig" rid="fig5">Figure 5</xref>), and establishes a link between genetic variation and drug-resistant phenotypes based on SNPs differences (<xref ref-type="fig" rid="fig6">Figure 6</xref>). This locks in the DRMP, serving as a molecular fingerprint and precise molecular drug susceptibility indicator for resistant strains, aiding in the evaluation of resistant conditions in variant strains (including unknown ones) and determining optimal treatment options, thus facilitating the implementation of precision personalized treatment. Beyond direct diagnosis and treatment guidance, DRMP characterization offers significant clinical and epidemiological value. Clinically, specific mutation patterns may predict resistance-associated fitness costs, influencing <italic>M. tuberculosis</italic> transmissibility and relapse risk. This enables patient stratification for enhanced follow-up or infection control. Epidemiologically, DRMP act as molecular fingerprints for tracking transmission. Clusters sharing rare DRMP signal local outbreaks, while geographically distinct patterns reveal cross-border spread. Pan-genomic DRMP analysis identifies regionally prevalent resistance mechanisms, exposing gaps in local drug regulation or prescribing practices. These insights prioritize targeted surveillance, optimize resource allocation for containment, and inform early-warning systems for emerging threats.</p>
<p>In summary, this study adopts a pan-genomic perspective to comprehensively analyze the correlation between the evolution of <italic>M. tuberculosis</italic> and its drug resistance. The findings suggest that developing new antibiotics targeting certain key and conserved genes can enhance drug sensitivity and decrease the possibility of drug resistance. Moreover, the research reveals a close association between the clustering of SNPs in clinical strains and drug-resistant characteristics, and identifies specific DRMP. This DRMP can serve as precise molecular markers for drug susceptibility, guiding the selection of effective medications and thereby providing personalized treatment options for clinical therapy.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="sec22">
<title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article/<xref rid="SM1" ref-type="supplementary-material">Supplementary material</xref>, further inquiries can be directed to the corresponding authors.</p>
</sec>
<sec sec-type="author-contributions" id="sec23">
<title>Author contributions</title>
<p>XS: Data curation, Software, Visualization, Writing &#x2013; original draft. PX: Data curation, Methodology, Software, Validation, Writing &#x2013; original draft. YS: Investigation, Methodology, Project administration, Writing &#x2013; original draft. NW: Conceptualization, Methodology, Software, Writing &#x2013; original draft. YL: Conceptualization, Formal analysis, Methodology, Project administration, Writing &#x2013; original draft, Writing &#x2013; review &#x0026; editing.</p>
</sec>
<sec sec-type="funding-information" id="sec24">
<title>Funding</title>
<p>The author(s) declare that no financial support was received for the research and/or publication of this article.</p>
</sec>
<sec sec-type="COI-statement" id="sec25">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="ai-statement" id="sec26">
<title>Generative AI statement</title>
<p>The authors declare that no Gen AI was used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p>
</sec>
<sec sec-type="disclaimer" id="sec27">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec sec-type="supplementary-material" id="sec28">
<title>Supplementary material</title>
<p>The Supplementary material for this article can be found online at: <ext-link xlink:href="https://www.frontiersin.org/articles/10.3389/fmicb.2025.1663069/full#supplementary-material" ext-link-type="uri">https://www.frontiersin.org/articles/10.3389/fmicb.2025.1663069/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Table_1.XLSX" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<fn-group>
<fn id="fn0001"><p><sup>1</sup><ext-link xlink:href="https://www.ncbi.nlm.nih.gov/sra" ext-link-type="uri">https://www.ncbi.nlm.nih.gov/sra</ext-link></p></fn>
<fn id="fn0002"><p><sup>2</sup><ext-link xlink:href="https://www.ncbi.nlm.nih.gov/datasets/genome/?taxon=1773" ext-link-type="uri">https://www.ncbi.nlm.nih.gov/datasets/genome/?taxon=1773</ext-link></p></fn>
<fn id="fn0003"><p><sup>3</sup><ext-link xlink:href="https://busco-data.ezlab.org/v5/data/lineages/" ext-link-type="uri">https://busco-data.ezlab.org/v5/data/lineages/</ext-link></p></fn>
<fn id="fn0004"><p><sup>4</sup><ext-link xlink:href="https://github.com/dbespiatykh/TB-gen" ext-link-type="uri">https://github.com/dbespiatykh/TB-gen</ext-link></p></fn>
<fn id="fn0005"><p><sup>5</sup><ext-link xlink:href="https://github.com/Ankitapal1995/TB-AMRpred" ext-link-type="uri">https://github.com/Ankitapal1995/TB-AMRpred</ext-link></p></fn>
<fn id="fn0006"><p><sup>6</sup><ext-link xlink:href="https://github.com/avkitex/tbAnnotator" ext-link-type="uri">https://github.com/avkitex/tbAnnotator</ext-link></p></fn>
</fn-group>
<ref-list>
<title>References</title>
<ref id="ref1"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ahmad</surname><given-names>S.</given-names></name> <name><surname>Mokaddas</surname><given-names>E.</given-names></name> <name><surname>Al-Mutairi</surname><given-names>N.</given-names></name> <name><surname>Eldeen</surname><given-names>H. S.</given-names></name> <name><surname>Mohammadi</surname><given-names>S.</given-names></name></person-group> (<year>2016</year>). <article-title>Discordance across phenotypic and molecular methods for drug susceptibility testing of drug-resistant <italic>Mycobacterium tuberculosis</italic> isolates in a low TB incidence country</article-title>. <source>PLoS One</source> <volume>11</volume>:<fpage>e0153563</fpage>. doi: <pub-id pub-id-type="doi">10.1371/journal.pone.0153563</pub-id>, PMID: <pub-id pub-id-type="pmid">27096759</pub-id></citation></ref>
<ref id="ref2"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Allix-B&#x00E9;guec</surname><given-names>C.</given-names></name> <name><surname>Arandjelovic</surname><given-names>I.</given-names></name> <name><surname>Bi</surname><given-names>L.</given-names></name> <name><surname>Beckert</surname><given-names>P.</given-names></name> <name><surname>Bonnet</surname><given-names>M.</given-names></name> <name><surname>Bradley</surname><given-names>P.</given-names></name> <etal/></person-group>. (<year>2018</year>). <article-title>Prediction of susceptibility to first-line tuberculosis drugs by DNA sequencing</article-title>. <source>N. Engl. J. Med.</source> <volume>379</volume>, <fpage>1403</fpage>&#x2013;<lpage>1415</lpage>. doi: <pub-id pub-id-type="doi">10.1056/NEJMoa1800474</pub-id>, PMID: <pub-id pub-id-type="pmid">30280646</pub-id></citation></ref>
<ref id="ref3"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Arnold</surname><given-names>B. J.</given-names></name> <name><surname>Huang</surname><given-names>I. T.</given-names></name> <name><surname>Hanage</surname><given-names>W. P.</given-names></name></person-group> (<year>2022</year>). <article-title>Horizontal gene transfer and adaptive evolution in bacteria</article-title>. <source>Nat. Rev. Microbiol.</source> <volume>20</volume>, <fpage>206</fpage>&#x2013;<lpage>218</lpage>. doi: <pub-id pub-id-type="doi">10.1038/s41579-021-00650-4</pub-id>, PMID: <pub-id pub-id-type="pmid">34773098</pub-id></citation></ref>
<ref id="ref4"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Aubry</surname><given-names>A.</given-names></name> <name><surname>Veziris</surname><given-names>N.</given-names></name> <name><surname>Cambau</surname><given-names>E.</given-names></name> <name><surname>Truffot-Pernot</surname><given-names>C.</given-names></name> <name><surname>Jarlier</surname><given-names>V.</given-names></name> <name><surname>Fisher</surname><given-names>L. M.</given-names></name></person-group> (<year>2006</year>). <article-title>Novel gyrase mutations in quinolone-resistant and -hypersusceptible clinical isolates of <italic>Mycobacterium tuberculosis</italic>: functional analysis of mutant enzymes</article-title>. <source>Antimicrob. Agents Chemother.</source> <volume>50</volume>, <fpage>104</fpage>&#x2013;<lpage>112</lpage>. doi: <pub-id pub-id-type="doi">10.1128/aac.50.1.104-112.2006</pub-id>, PMID: <pub-id pub-id-type="pmid">16377674</pub-id></citation></ref>
<ref id="ref5"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bertels</surname><given-names>F.</given-names></name> <name><surname>Silander</surname><given-names>O. K.</given-names></name> <name><surname>Pachkov</surname><given-names>M.</given-names></name> <name><surname>Rainey</surname><given-names>P. B.</given-names></name> <name><surname>van Nimwegen</surname><given-names>E.</given-names></name></person-group> (<year>2014</year>). <article-title>Automated reconstruction of whole-genome phylogenies from short-sequence reads</article-title>. <source>Mol. Biol. Evol.</source> <volume>31</volume>, <fpage>1077</fpage>&#x2013;<lpage>1088</lpage>. doi: <pub-id pub-id-type="doi">10.1093/molbev/msu088</pub-id>, PMID: <pub-id pub-id-type="pmid">24600054</pub-id></citation></ref>
<ref id="ref6"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bolger</surname><given-names>A. M.</given-names></name> <name><surname>Lohse</surname><given-names>M.</given-names></name> <name><surname>Usadel</surname><given-names>B.</given-names></name></person-group> (<year>2014</year>). <article-title>Trimmomatic: a flexible trimmer for Illumina sequence data</article-title>. <source>Bioinformatics</source> <volume>30</volume>, <fpage>2114</fpage>&#x2013;<lpage>2120</lpage>. doi: <pub-id pub-id-type="doi">10.1093/bioinformatics/btu170</pub-id>, PMID: <pub-id pub-id-type="pmid">24695404</pub-id></citation></ref>
<ref id="ref7"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Brown</surname><given-names>C. L.</given-names></name> <name><surname>Mullet</surname><given-names>J.</given-names></name> <name><surname>Hindi</surname><given-names>F.</given-names></name> <name><surname>Stoll</surname><given-names>J. E.</given-names></name> <name><surname>Gupta</surname><given-names>S.</given-names></name> <name><surname>Choi</surname><given-names>M.</given-names></name> <etal/></person-group>. (<year>2022</year>). <article-title>mobileOG-db: a manually curated database of protein families mediating the life cycle of bacterial mobile genetic elements</article-title>. <source>Appl. Environ. Microbiol.</source> <volume>88</volume>:<fpage>e0099122</fpage>. doi: <pub-id pub-id-type="doi">10.1128/aem.00991-22</pub-id>, PMID: <pub-id pub-id-type="pmid">36036594</pub-id></citation></ref>
<ref id="ref8"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Camacho</surname><given-names>C.</given-names></name> <name><surname>Coulouris</surname><given-names>G.</given-names></name> <name><surname>Avagyan</surname><given-names>V.</given-names></name> <name><surname>Ma</surname><given-names>N.</given-names></name> <name><surname>Papadopoulos</surname><given-names>J.</given-names></name> <name><surname>Bealer</surname><given-names>K.</given-names></name> <etal/></person-group>. (<year>2009</year>). <article-title>BLAST+: architecture and applications</article-title>. <source>BMC Bioinformatics</source> <volume>10</volume>:<fpage>421</fpage>. doi: <pub-id pub-id-type="doi">10.1186/1471-2105-10-421</pub-id>, PMID: <pub-id pub-id-type="pmid">20003500</pub-id></citation></ref>
<ref id="ref9"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cao</surname><given-names>Y.</given-names></name> <name><surname>Parmar</surname><given-names>H.</given-names></name> <name><surname>Gaur</surname><given-names>R. L.</given-names></name> <name><surname>Lieu</surname><given-names>D.</given-names></name> <name><surname>Raghunath</surname><given-names>S.</given-names></name> <name><surname>Via</surname><given-names>N.</given-names></name> <etal/></person-group>. (<year>2021</year>). <article-title>Xpert MTB/XDR: a 10-color reflex assay suitable for point-of-care settings to detect isoniazid, fluoroquinolone, and second-line-injectable-drug resistance directly from <italic>Mycobacterium tuberculosis</italic>-positive sputum</article-title>. <source>J. Clin. Microbiol.</source> <volume>59</volume>:<fpage>e02314-20</fpage>. doi: <pub-id pub-id-type="doi">10.1128/jcm.02314-20</pub-id>, PMID: <pub-id pub-id-type="pmid">33298611</pub-id></citation></ref>
<ref id="ref10"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Capella-Guti&#x00E9;rrez</surname><given-names>S.</given-names></name> <name><surname>Silla-Mart&#x00ED;nez</surname><given-names>J. M.</given-names></name> <name><surname>Gabald&#x00F3;n</surname><given-names>T.</given-names></name></person-group> (<year>2009</year>). <article-title>trimAl: a tool for automated alignment trimming in large-scale phylogenetic analyses</article-title>. <source>Bioinformatics</source> <volume>25</volume>, <fpage>1972</fpage>&#x2013;<lpage>1973</lpage>. doi: <pub-id pub-id-type="doi">10.1093/bioinformatics/btp348</pub-id>, PMID: <pub-id pub-id-type="pmid">19505945</pub-id></citation></ref>
<ref id="ref11"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chen</surname><given-names>Y.</given-names></name> <name><surname>Takiff</surname><given-names>H. E.</given-names></name> <name><surname>Gao</surname><given-names>Q.</given-names></name></person-group> (<year>2023</year>). <article-title>Phenotypic instability of <italic>Mycobacterium tuberculosis</italic> strains harbouring clinically prevalent drug-resistant mutations</article-title>. <source>Lancet Microbe</source> <volume>4</volume>:<fpage>e292</fpage>. doi: <pub-id pub-id-type="doi">10.1016/s2666-5247(23)00007-1</pub-id>, PMID: <pub-id pub-id-type="pmid">36716755</pub-id></citation></ref>
<ref id="ref12"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cohen</surname><given-names>K. A.</given-names></name> <name><surname>Abeel</surname><given-names>T.</given-names></name> <name><surname>Manson McGuire</surname><given-names>A.</given-names></name> <name><surname>Desjardins</surname><given-names>C. A.</given-names></name> <name><surname>Munsamy</surname><given-names>V.</given-names></name> <name><surname>Shea</surname><given-names>T. P.</given-names></name> <etal/></person-group>. (<year>2015</year>). <article-title>Evolution of extensively drug-resistant tuberculosis over four decades: whole genome sequencing and dating analysis of <italic>Mycobacterium tuberculosis</italic> isolates from KwaZulu-Natal</article-title>. <source>PLoS Med.</source> <volume>12</volume>:<fpage>e1001880</fpage>. doi: <pub-id pub-id-type="doi">10.1371/journal.pmed.1001880</pub-id>, PMID: <pub-id pub-id-type="pmid">26418737</pub-id></citation></ref>
<ref id="ref13"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Danecek</surname><given-names>P.</given-names></name> <name><surname>Bonfield</surname><given-names>J. K.</given-names></name> <name><surname>Liddle</surname><given-names>J.</given-names></name> <name><surname>Marshall</surname><given-names>J.</given-names></name> <name><surname>Ohan</surname><given-names>V.</given-names></name> <name><surname>Pollard</surname><given-names>M. O.</given-names></name> <etal/></person-group>. (<year>2021</year>). <article-title>Twelve years of SAMtools and BCFtools</article-title>. <source>GigaScience</source> <volume>10</volume>:<fpage>giab008</fpage>. doi: <pub-id pub-id-type="doi">10.1093/gigascience/giab008</pub-id>, PMID: <pub-id pub-id-type="pmid">33590861</pub-id></citation></ref>
<ref id="ref14"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dheda</surname><given-names>K.</given-names></name> <name><surname>Gumbo</surname><given-names>T.</given-names></name> <name><surname>Gandhi</surname><given-names>N. R.</given-names></name> <name><surname>Murray</surname><given-names>M.</given-names></name> <name><surname>Theron</surname><given-names>G.</given-names></name> <name><surname>Udwadia</surname><given-names>Z.</given-names></name> <etal/></person-group>. (<year>2014</year>). <article-title>Global control of tuberculosis: from extensively drug-resistant to untreatable tuberculosis</article-title>. <source>Lancet Respir. Med.</source> <volume>2</volume>, <fpage>321</fpage>&#x2013;<lpage>338</lpage>. doi: <pub-id pub-id-type="doi">10.1016/s2213-2600(14)70031-1</pub-id>, PMID: <pub-id pub-id-type="pmid">24717628</pub-id></citation></ref>
<ref id="ref15"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ding</surname><given-names>W.</given-names></name> <name><surname>Baumdicker</surname><given-names>F.</given-names></name> <name><surname>Neher</surname><given-names>R. A.</given-names></name></person-group> (<year>2017</year>). <article-title>panX: pan-genome analysis and exploration</article-title>. <source>Nucleic Acids Res.</source> <volume>46</volume>:<fpage>e5</fpage>. doi: <pub-id pub-id-type="doi">10.1093/nar/gkx977</pub-id>, PMID: <pub-id pub-id-type="pmid">29077859</pub-id></citation></ref>
<ref id="ref16"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dom&#x00ED;nguez</surname><given-names>J.</given-names></name> <name><surname>Boeree</surname><given-names>M. J.</given-names></name> <name><surname>Cambau</surname><given-names>E.</given-names></name> <name><surname>Chesov</surname><given-names>D.</given-names></name> <name><surname>Conradie</surname><given-names>F.</given-names></name> <name><surname>Cox</surname><given-names>V.</given-names></name> <etal/></person-group>. (<year>2023</year>). <article-title>Clinical implications of molecular drug resistance testing for <italic>Mycobacterium tuberculosis</italic>: a 2023 TBnet/RESIST-TB consensus statement</article-title>. <source>Lancet Infect. Dis.</source> <volume>23</volume>, <fpage>e122</fpage>&#x2013;<lpage>e137</lpage>. doi: <pub-id pub-id-type="doi">10.1016/S1473-3099(22)00875-1</pub-id>, PMID: <pub-id pub-id-type="pmid">36868253</pub-id></citation></ref>
<ref id="ref17"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Driesen</surname><given-names>M.</given-names></name> <name><surname>Kondo</surname><given-names>Y.</given-names></name> <name><surname>de Jong</surname><given-names>B. C.</given-names></name> <name><surname>Torrea</surname><given-names>G.</given-names></name> <name><surname>Asnong</surname><given-names>S.</given-names></name> <name><surname>Desmaretz</surname><given-names>C.</given-names></name> <etal/></person-group>. (<year>2018</year>). <article-title>Evaluation of a novel line probe assay to detect resistance to pyrazinamide, a key drug used for tuberculosis treatment</article-title>. <source>Clin. Microbiol. Infect.</source> <volume>24</volume>, <fpage>60</fpage>&#x2013;<lpage>64</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.cmi.2017.05.026</pub-id>, PMID: <pub-id pub-id-type="pmid">28587904</pub-id></citation></ref>
<ref id="ref18"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ehrt</surname><given-names>S.</given-names></name> <name><surname>Schnappinger</surname><given-names>D.</given-names></name> <name><surname>Rhee</surname><given-names>K. Y.</given-names></name></person-group> (<year>2018</year>). <article-title>Metabolic principles of persistence and pathogenicity in <italic>Mycobacterium tuberculosis</italic></article-title>. <source>Nat. Rev. Microbiol.</source> <volume>16</volume>, <fpage>496</fpage>&#x2013;<lpage>507</lpage>. doi: <pub-id pub-id-type="doi">10.1038/s41579-018-0013-4</pub-id>, PMID: <pub-id pub-id-type="pmid">29691481</pub-id></citation></ref>
<ref id="ref19"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Eldholm</surname><given-names>V.</given-names></name> <name><surname>Norheim</surname><given-names>G.</given-names></name> <name><surname>von der Lippe</surname><given-names>B.</given-names></name> <name><surname>Kinander</surname><given-names>W.</given-names></name> <name><surname>Dahle</surname><given-names>U. R.</given-names></name> <name><surname>Caugant</surname><given-names>D. A.</given-names></name> <etal/></person-group>. (<year>2014</year>). <article-title>Evolution of extensively drug-resistant <italic>Mycobacterium tuberculosis</italic> from a susceptible ancestor in a single patient</article-title>. <source>Genome Biol.</source> <volume>15</volume>:<fpage>490</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s13059-014-0490-3</pub-id>, PMID: <pub-id pub-id-type="pmid">25418686</pub-id></citation></ref>
<ref id="ref20"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Emms</surname><given-names>D. M.</given-names></name> <name><surname>Kelly</surname><given-names>S.</given-names></name></person-group> (<year>2015</year>). <article-title>OrthoFinder: solving fundamental biases in whole genome comparisons dramatically improves orthogroup inference accuracy</article-title>. <source>Genome Biol.</source> <volume>16</volume>:<fpage>157</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s13059-015-0721-2</pub-id>, PMID: <pub-id pub-id-type="pmid">26243257</pub-id></citation></ref>
<ref id="ref21"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Escalante</surname><given-names>P.</given-names></name> <name><surname>Ramaswamy</surname><given-names>S.</given-names></name> <name><surname>Sanabria</surname><given-names>H.</given-names></name> <name><surname>Soini</surname><given-names>H.</given-names></name> <name><surname>Pan</surname><given-names>X.</given-names></name> <name><surname>Valiente-Castillo</surname><given-names>O.</given-names></name> <etal/></person-group>. (<year>1998</year>). <article-title>Genotypic characterization of drug-resistant <italic>Mycobacterium tuberculosis</italic> isolates from Peru</article-title>. <source>Tuberc. Lung Dis.</source> <volume>79</volume>, <fpage>111</fpage>&#x2013;<lpage>118</lpage>. doi: <pub-id pub-id-type="doi">10.1054/tuld.1998.0013</pub-id></citation></ref>
<ref id="ref22"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Farhat</surname><given-names>M.</given-names></name> <name><surname>Cox</surname><given-names>H.</given-names></name> <name><surname>Ghanem</surname><given-names>M.</given-names></name> <name><surname>Denkinger</surname><given-names>C. M.</given-names></name> <name><surname>Rodrigues</surname><given-names>C.</given-names></name> <name><surname>Abd El Aziz</surname><given-names>M. S.</given-names></name> <etal/></person-group>. (<year>2024</year>). <article-title>Drug-resistant tuberculosis: a persistent global health concern</article-title>. <source>Nat. Rev. Microbiol.</source> <volume>22</volume>, <fpage>617</fpage>&#x2013;<lpage>635</lpage>. doi: <pub-id pub-id-type="doi">10.1038/s41579-024-01025-1</pub-id></citation></ref>
<ref id="ref23"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Finn</surname><given-names>R. D.</given-names></name> <name><surname>Clements</surname><given-names>J.</given-names></name> <name><surname>Eddy</surname><given-names>S. R.</given-names></name></person-group> (<year>2011</year>). <article-title>HMMER web server: interactive sequence similarity searching</article-title>. <source>Nucleic Acids Res.</source> <volume>39</volume>, <fpage>W29</fpage>&#x2013;<lpage>W37</lpage>. doi: <pub-id pub-id-type="doi">10.1093/nar/gkr367</pub-id></citation></ref>
<ref id="ref24"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gagneux</surname><given-names>S.</given-names></name></person-group> (<year>2018</year>). <article-title>Ecology and evolution of <italic>Mycobacterium tuberculosis</italic></article-title>. <source>Nat. Rev. Microbiol.</source> <volume>16</volume>, <fpage>202</fpage>&#x2013;<lpage>213</lpage>. doi: <pub-id pub-id-type="doi">10.1038/nrmicro.2018.8</pub-id>, PMID: <pub-id pub-id-type="pmid">29456241</pub-id></citation></ref>
<ref id="ref25"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gandhi</surname><given-names>N. R.</given-names></name> <name><surname>Nunn</surname><given-names>P.</given-names></name> <name><surname>Dheda</surname><given-names>K.</given-names></name> <name><surname>Schaaf</surname><given-names>H. S.</given-names></name> <name><surname>Zignol</surname><given-names>M.</given-names></name> <name><surname>van Soolingen</surname><given-names>D.</given-names></name> <etal/></person-group>. (<year>2010</year>). <article-title>Multidrug-resistant and extensively drug-resistant tuberculosis: a threat to global control of tuberculosis</article-title>. <source>Lancet</source> <volume>375</volume>, <fpage>1830</fpage>&#x2013;<lpage>1843</lpage>. doi: <pub-id pub-id-type="doi">10.1016/s0140-6736(10)60410-2</pub-id>, PMID: <pub-id pub-id-type="pmid">20488523</pub-id></citation></ref>
<ref id="ref26"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gautreau</surname><given-names>G.</given-names></name> <name><surname>Bazin</surname><given-names>A.</given-names></name> <name><surname>Gachet</surname><given-names>M.</given-names></name> <name><surname>Planel</surname><given-names>R.</given-names></name> <name><surname>Burlot</surname><given-names>L.</given-names></name> <name><surname>Dubois</surname><given-names>M.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>PPanGGOLiN: depicting microbial diversity via a partitioned pangenome graph</article-title>. <source>PLoS Comput. Biol.</source> <volume>16</volume>:<fpage>e1007732</fpage>. doi: <pub-id pub-id-type="doi">10.1371/journal.pcbi.1007732</pub-id>, PMID: <pub-id pub-id-type="pmid">32191703</pub-id></citation></ref>
<ref id="ref27"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Grant</surname><given-names>J. R.</given-names></name> <name><surname>Enns</surname><given-names>E.</given-names></name> <name><surname>Marinier</surname><given-names>E.</given-names></name> <name><surname>Mandal</surname><given-names>A.</given-names></name> <name><surname>Herman</surname><given-names>E. K.</given-names></name> <name><surname>Chen</surname><given-names>C. Y.</given-names></name> <etal/></person-group>. (<year>2023</year>). <article-title>Proksee: in-depth characterization and visualization of bacterial genomes</article-title>. <source>Nucleic Acids Res.</source> <volume>51</volume>, <fpage>W484</fpage>&#x2013;<lpage>W492</lpage>. doi: <pub-id pub-id-type="doi">10.1093/nar/gkad326</pub-id>, PMID: <pub-id pub-id-type="pmid">37140037</pub-id></citation></ref>
<ref id="ref28"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hanif</surname><given-names>M.</given-names></name> <name><surname>Arora</surname><given-names>V. K.</given-names></name></person-group> (<year>2022</year>). <article-title><italic>Mycobacterium tuberculosis</italic> next-generation whole genome sequencing</article-title>. <source>Indian J. Tuberc.</source> <volume>69</volume>, <fpage>123</fpage>&#x2013;<lpage>124</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.ijtb.2022.03.010</pub-id>, PMID: <pub-id pub-id-type="pmid">35379388</pub-id></citation></ref>
<ref id="ref29"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>He</surname><given-names>W.</given-names></name> <name><surname>Xu</surname><given-names>L.</given-names></name> <name><surname>Wang</surname><given-names>J.</given-names></name> <name><surname>Yue</surname><given-names>Z.</given-names></name> <name><surname>Jing</surname><given-names>Y.</given-names></name> <name><surname>Tai</surname><given-names>S.</given-names></name> <etal/></person-group>. (<year>2024</year>). <article-title>VCF2PCACluster: a simple, fast and memory-efficient tool for principal component analysis of tens of millions of SNPs</article-title>. <source>BMC Bioinformatics</source> <volume>25</volume>:<fpage>173</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s12859-024-05770-1</pub-id>, PMID: <pub-id pub-id-type="pmid">38693489</pub-id></citation></ref>
<ref id="ref30"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Inman</surname><given-names>J. M.</given-names></name> <name><surname>Sutton</surname><given-names>G. G.</given-names></name> <name><surname>Beck</surname><given-names>E.</given-names></name> <name><surname>Brinkac</surname><given-names>L. M.</given-names></name> <name><surname>Clarke</surname><given-names>T. H.</given-names></name> <name><surname>Fouts</surname><given-names>D. E.</given-names></name></person-group> (<year>2019</year>). <article-title>Large-scale comparative analysis of microbial pan-genomes using PanOCT</article-title>. <source>Bioinformatics</source> <volume>35</volume>, <fpage>1049</fpage>&#x2013;<lpage>1050</lpage>. doi: <pub-id pub-id-type="doi">10.1093/bioinformatics/bty744</pub-id>, PMID: <pub-id pub-id-type="pmid">30165579</pub-id></citation></ref>
<ref id="ref31"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jang</surname><given-names>J. G.</given-names></name> <name><surname>Chung</surname><given-names>J. H.</given-names></name></person-group> (<year>2020</year>). <article-title>Diagnosis and treatment of multidrug-resistant tuberculosis</article-title>. <source>Yeungnam Univ. J. Med.</source> <volume>37</volume>, <fpage>277</fpage>&#x2013;<lpage>285</lpage>. doi: <pub-id pub-id-type="doi">10.12701/yujm.2020.00626</pub-id>, PMID: <pub-id pub-id-type="pmid">32883054</pub-id></citation></ref>
<ref id="ref32"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jia</surname><given-names>X.</given-names></name> <name><surname>Yang</surname><given-names>L.</given-names></name> <name><surname>Dong</surname><given-names>M.</given-names></name> <name><surname>Chen</surname><given-names>S.</given-names></name> <name><surname>Lv</surname><given-names>L.</given-names></name> <name><surname>Cao</surname><given-names>D.</given-names></name> <etal/></person-group>. (<year>2017</year>). <article-title>The bioinformatics analysis of comparative genomics of <italic>Mycobacterium tuberculosis</italic> complex (MTBC) provides insight into dissimilarities between intraspecific groups differing in host association, virulence, and epitope diversity</article-title>. <source>Front. Cell. Infect. Microbiol.</source> <volume>7</volume>:<fpage>88</fpage>. doi: <pub-id pub-id-type="doi">10.3389/fcimb.2017.00088</pub-id>, PMID: <pub-id pub-id-type="pmid">28377903</pub-id></citation></ref>
<ref id="ref33"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jung</surname><given-names>Y.</given-names></name> <name><surname>Han</surname><given-names>D.</given-names></name></person-group> (<year>2022</year>). <article-title>BWA-MEME: BWA-MEM emulated with a machine learning approach</article-title>. <source>Bioinformatics</source> <volume>38</volume>, <fpage>2404</fpage>&#x2013;<lpage>2413</lpage>. doi: <pub-id pub-id-type="doi">10.1093/bioinformatics/btac137</pub-id>, PMID: <pub-id pub-id-type="pmid">35253835</pub-id></citation></ref>
<ref id="ref34"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kalyaanamoorthy</surname><given-names>S.</given-names></name> <name><surname>Minh</surname><given-names>B. Q.</given-names></name> <name><surname>Wong</surname><given-names>T. K. F.</given-names></name> <name><surname>von Haeseler</surname><given-names>A.</given-names></name> <name><surname>Jermiin</surname><given-names>L. S.</given-names></name></person-group> (<year>2017</year>). <article-title>ModelFinder: fast model selection for accurate phylogenetic estimates</article-title>. <source>Nat. Methods</source> <volume>14</volume>, <fpage>587</fpage>&#x2013;<lpage>589</lpage>. doi: <pub-id pub-id-type="doi">10.1038/nmeth.4285</pub-id>, PMID: <pub-id pub-id-type="pmid">28481363</pub-id></citation></ref>
<ref id="ref35"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kille</surname><given-names>B.</given-names></name> <name><surname>Nute</surname><given-names>M. G.</given-names></name> <name><surname>Huang</surname><given-names>V.</given-names></name> <name><surname>Kim</surname><given-names>E.</given-names></name> <name><surname>Phillippy</surname><given-names>A. M.</given-names></name> <name><surname>Treangen</surname><given-names>T. J.</given-names></name></person-group> (<year>2024</year>). <article-title>Parsnp 2.0: scalable core-genome alignment for massive microbial datasets</article-title>. <source>Bioinformatics</source> <volume>40</volume>:<fpage>btae311</fpage>. doi: <pub-id pub-id-type="doi">10.1093/bioinformatics/btae311</pub-id>, PMID: <pub-id pub-id-type="pmid">38724243</pub-id></citation></ref>
<ref id="ref36"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Koch</surname><given-names>A.</given-names></name> <name><surname>Mizrahi</surname><given-names>V.</given-names></name></person-group> (<year>2018</year>). <article-title>Mycobacterium tuberculosis</article-title>. <source>Trends Microbiol.</source> <volume>26</volume>, <fpage>555</fpage>&#x2013;<lpage>556</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.tim.2018.02.012</pub-id>, PMID: <pub-id pub-id-type="pmid">29580884</pub-id></citation></ref>
<ref id="ref37"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lanfear</surname><given-names>R.</given-names></name> <name><surname>Frandsen</surname><given-names>P. B.</given-names></name> <name><surname>Wright</surname><given-names>A. M.</given-names></name> <name><surname>Senfeld</surname><given-names>T.</given-names></name> <name><surname>Calcott</surname><given-names>B.</given-names></name></person-group> (<year>2017</year>). <article-title>Partitionfinder 2: new methods for selecting partitioned models of evolution for molecular and morphological phylogenetic analyses</article-title>. <source>Mol. Biol. Evol.</source> <volume>34</volume>, <fpage>772</fpage>&#x2013;<lpage>773</lpage>. doi: <pub-id pub-id-type="doi">10.1093/molbev/msw260</pub-id>, PMID: <pub-id pub-id-type="pmid">28013191</pub-id></citation></ref>
<ref id="ref38"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lavender</surname><given-names>C.</given-names></name> <name><surname>Globan</surname><given-names>M.</given-names></name> <name><surname>Sievers</surname><given-names>A.</given-names></name> <name><surname>Billman-Jacobe</surname><given-names>H.</given-names></name> <name><surname>Fyfe</surname><given-names>J.</given-names></name></person-group> (<year>2005</year>). <article-title>Molecular characterization of isoniazid-resistant <italic>Mycobacterium tuberculosis</italic> isolates collected in Australia</article-title>. <source>Antimicrob. Agents Chemother.</source> <volume>49</volume>, <fpage>4068</fpage>&#x2013;<lpage>4074</lpage>. doi: <pub-id pub-id-type="doi">10.1128/aac.49.10.4068-4074.2005</pub-id>, PMID: <pub-id pub-id-type="pmid">16189082</pub-id></citation></ref>
<ref id="ref39"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lee</surname><given-names>H.</given-names></name> <name><surname>Cho</surname><given-names>S. N.</given-names></name> <name><surname>Bang</surname><given-names>H. E.</given-names></name> <name><surname>Lee</surname><given-names>J. H.</given-names></name> <name><surname>Bai</surname><given-names>G. H.</given-names></name> <name><surname>Kim</surname><given-names>S. J.</given-names></name> <etal/></person-group>. (<year>2000</year>). <article-title>Exclusive mutations related to isoniazid and ethionamide resistance among <italic>Mycobacterium tuberculosis</italic> isolates from Korea</article-title>. <source>Int. J. Tuberc. Lung Dis.</source> <volume>4</volume>, <fpage>441</fpage>&#x2013;<lpage>447</lpage>.</citation></ref>
<ref id="ref40"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lee</surname><given-names>A. S.</given-names></name> <name><surname>Othman</surname><given-names>S. N.</given-names></name> <name><surname>Ho</surname><given-names>Y. M.</given-names></name> <name><surname>Wong</surname><given-names>S. Y.</given-names></name></person-group> (<year>2004</year>). <article-title>Novel mutations within the <italic>embB</italic> gene in ethambutol-susceptible clinical isolates of <italic>Mycobacterium tuberculosis</italic></article-title>. <source>Antimicrob. Agents Chemother.</source> <volume>48</volume>, <fpage>4447</fpage>&#x2013;<lpage>4449</lpage>. doi: <pub-id pub-id-type="doi">10.1128/aac.48.11.4447-4449.2004</pub-id>, PMID: <pub-id pub-id-type="pmid">15504879</pub-id></citation></ref>
<ref id="ref41"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Letunic</surname><given-names>I.</given-names></name> <name><surname>Bork</surname><given-names>P.</given-names></name></person-group> (<year>2021</year>). <article-title>Interactive Tree of Life (iTOL) v5: an online tool for phylogenetic tree display and annotation</article-title>. <source>Nucleic Acids Res.</source> <volume>49</volume>, <fpage>W293</fpage>&#x2013;<lpage>W296</lpage>. doi: <pub-id pub-id-type="doi">10.1093/nar/gkab301</pub-id>, PMID: <pub-id pub-id-type="pmid">33885785</pub-id></citation></ref>
<ref id="ref42"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname><given-names>L.</given-names></name> <name><surname>Stoeckert</surname><given-names>C. J.</given-names> <suffix>Jr.</suffix></name> <name><surname>Roos</surname><given-names>D. S.</given-names></name></person-group> (<year>2003</year>). <article-title>OrthoMCL: identification of ortholog groups for eukaryotic genomes</article-title>. <source>Genome Res.</source> <volume>13</volume>, <fpage>2178</fpage>&#x2013;<lpage>2189</lpage>. doi: <pub-id pub-id-type="doi">10.1101/gr.1224503</pub-id>, PMID: <pub-id pub-id-type="pmid">12952885</pub-id></citation></ref>
<ref id="ref43"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Liu</surname><given-names>D.</given-names></name> <name><surname>Zhang</surname><given-names>Y.</given-names></name> <name><surname>Fan</surname><given-names>G.</given-names></name> <name><surname>Sun</surname><given-names>D.</given-names></name> <name><surname>Zhang</surname><given-names>X.</given-names></name> <name><surname>Yu</surname><given-names>Z.</given-names></name> <etal/></person-group>. (<year>2022</year>). <article-title>IPGA: a handy integrated prokaryotes genome and pan-genome analysis web service</article-title>. <source>iMeta</source> <volume>1</volume>:<fpage>e55</fpage>. doi: <pub-id pub-id-type="doi">10.1002/imt2.55</pub-id>, PMID: <pub-id pub-id-type="pmid">38867900</pub-id></citation></ref>
<ref id="ref44"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Luo</surname><given-names>R.</given-names></name> <name><surname>Liu</surname><given-names>B.</given-names></name> <name><surname>Xie</surname><given-names>Y.</given-names></name> <name><surname>Li</surname><given-names>Z.</given-names></name> <name><surname>Huang</surname><given-names>W.</given-names></name> <name><surname>Yuan</surname><given-names>J.</given-names></name> <etal/></person-group>. (<year>2012</year>). <article-title>SOAPdenovo2: an empirically improved memory-efficient short-read de novo assembler</article-title>. <source>GigaScience</source> <volume>1</volume>:<fpage>18</fpage>. doi: <pub-id pub-id-type="doi">10.1186/2047-217x-1-18</pub-id>, PMID: <pub-id pub-id-type="pmid">23587118</pub-id></citation></ref>
<ref id="ref45"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Manni</surname><given-names>M.</given-names></name> <name><surname>Berkeley</surname><given-names>M. R.</given-names></name> <name><surname>Seppey</surname><given-names>M.</given-names></name> <name><surname>Sim&#x00E3;o</surname><given-names>F. A.</given-names></name> <name><surname>Zdobnov</surname><given-names>E. M.</given-names></name></person-group> (<year>2021</year>). <article-title>BUSCO update: novel and streamlined workflows along with broader and deeper phylogenetic coverage for scoring of eukaryotic, prokaryotic, and viral genomes</article-title>. <source>Mol. Biol. Evol.</source> <volume>38</volume>, <fpage>4647</fpage>&#x2013;<lpage>4654</lpage>. doi: <pub-id pub-id-type="doi">10.1093/molbev/msab199</pub-id>, PMID: <pub-id pub-id-type="pmid">34320186</pub-id></citation></ref>
<ref id="ref46"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Minh</surname><given-names>B. Q.</given-names></name> <name><surname>Schmidt</surname><given-names>H. A.</given-names></name> <name><surname>Chernomor</surname><given-names>O.</given-names></name> <name><surname>Schrempf</surname><given-names>D.</given-names></name> <name><surname>Woodhams</surname><given-names>M. D.</given-names></name> <name><surname>von Haeseler</surname><given-names>A.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>IQ-TREE 2: new models and efficient methods for phylogenetic inference in the genomic era</article-title>. <source>Mol. Biol. Evol.</source> <volume>37</volume>, <fpage>1530</fpage>&#x2013;<lpage>1534</lpage>. doi: <pub-id pub-id-type="doi">10.1093/molbev/msaa015</pub-id>, PMID: <pub-id pub-id-type="pmid">32011700</pub-id></citation></ref>
<ref id="ref47"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Morlock</surname><given-names>G. P.</given-names></name> <name><surname>Metchock</surname><given-names>B.</given-names></name> <name><surname>Sikes</surname><given-names>D.</given-names></name> <name><surname>Crawford</surname><given-names>J. T.</given-names></name> <name><surname>Cooksey</surname><given-names>R. C.</given-names></name></person-group> (<year>2003</year>). <article-title>ethA, inhA, and katG loci of ethionamide-resistant clinical <italic>Mycobacterium tuberculosis</italic> isolates</article-title>. <source>Antimicrob. Agents Chemother.</source> <volume>47</volume>, <fpage>3799</fpage>&#x2013;<lpage>3805</lpage>. doi: <pub-id pub-id-type="doi">10.1128/aac.47.12.3799-3805.2003</pub-id>, PMID: <pub-id pub-id-type="pmid">14638486</pub-id></citation></ref>
<ref id="ref48"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>M&#x00FC;ller</surname><given-names>B.</given-names></name> <name><surname>Borrell</surname><given-names>S.</given-names></name> <name><surname>Rose</surname><given-names>G.</given-names></name> <name><surname>Gagneux</surname><given-names>S.</given-names></name></person-group> (<year>2013</year>). <article-title>The heterogeneous evolution of multidrug-resistant <italic>Mycobacterium tuberculosis</italic></article-title>. <source>Trends Genet.</source> <volume>29</volume>, <fpage>160</fpage>&#x2013;<lpage>169</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.tig.2012.11.005</pub-id>, PMID: <pub-id pub-id-type="pmid">23245857</pub-id></citation></ref>
<ref id="ref49"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Napier</surname><given-names>G.</given-names></name> <name><surname>Campino</surname><given-names>S.</given-names></name> <name><surname>Merid</surname><given-names>Y.</given-names></name> <name><surname>Abebe</surname><given-names>M.</given-names></name> <name><surname>Woldeamanuel</surname><given-names>Y.</given-names></name> <name><surname>Aseffa</surname><given-names>A.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>Robust barcoding and identification of <italic>Mycobacterium tuberculosis</italic> lineages for epidemiological and clinical studies</article-title>. <source>Genome Med.</source> <volume>12</volume>:<fpage>114</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s13073-020-00817-3</pub-id>, PMID: <pub-id pub-id-type="pmid">33317631</pub-id></citation></ref>
<ref id="ref50"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Page</surname><given-names>A. J.</given-names></name> <name><surname>Cummins</surname><given-names>C. A.</given-names></name> <name><surname>Hunt</surname><given-names>M.</given-names></name> <name><surname>Wong</surname><given-names>V. K.</given-names></name> <name><surname>Reuter</surname><given-names>S.</given-names></name> <name><surname>Holden</surname><given-names>M. T. G.</given-names></name> <etal/></person-group>. (<year>2015</year>). <article-title>Roary: rapid large-scale prokaryote pan genome analysis</article-title>. <source>Bioinformatics</source> <volume>31</volume>, <fpage>3691</fpage>&#x2013;<lpage>3693</lpage>. doi: <pub-id pub-id-type="doi">10.1093/bioinformatics/btv421</pub-id>, PMID: <pub-id pub-id-type="pmid">26198102</pub-id></citation></ref>
<ref id="ref51"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pal</surname><given-names>A.</given-names></name> <name><surname>Mohanty</surname><given-names>D.</given-names></name></person-group> (<year>2025</year>). <article-title>Machine learning-based approach for identification of new resistance associated mutations from whole genome sequences of <italic>Mycobacterium tuberculosis</italic></article-title>. <source>Bioinformatics Adv.</source> <volume>5</volume>:<fpage>vbaf050</fpage>. doi: <pub-id pub-id-type="doi">10.1093/bioadv/vbaf050</pub-id>, PMID: <pub-id pub-id-type="pmid">40125545</pub-id></citation></ref>
<ref id="ref52"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Parks</surname><given-names>D. H.</given-names></name> <name><surname>Imelfort</surname><given-names>M.</given-names></name> <name><surname>Skennerton</surname><given-names>C. T.</given-names></name> <name><surname>Hugenholtz</surname><given-names>P.</given-names></name> <name><surname>Tyson</surname><given-names>G. W.</given-names></name></person-group> (<year>2015</year>). <article-title>CheckM: assessing the quality of microbial genomes recovered from isolates, single cells, and metagenomes</article-title>. <source>Genome Res.</source> <volume>25</volume>, <fpage>1043</fpage>&#x2013;<lpage>1055</lpage>. doi: <pub-id pub-id-type="doi">10.1101/gr.186072.114</pub-id>, PMID: <pub-id pub-id-type="pmid">25977477</pub-id></citation></ref>
<ref id="ref53"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Qadir</surname><given-names>M.</given-names></name> <name><surname>Khan</surname><given-names>M. T.</given-names></name> <name><surname>Khan</surname><given-names>S. A.</given-names></name> <name><surname>Akram</surname><given-names>M.</given-names></name> <name><surname>Canseco</surname><given-names>J. O.</given-names></name> <name><surname>Faryal</surname><given-names>R.</given-names></name> <etal/></person-group>. (<year>2024</year>). <article-title>Unveiling the complexity of rifampicin drug susceptibility testing in <italic>Mycobacterium tuberculosis</italic>: comparative analysis with next-generation sequencing</article-title>. <source>J. Med. Microbiol.</source> <volume>73</volume>:<fpage>e1884</fpage>. doi: <pub-id pub-id-type="doi">10.1099/jmm.0.001884</pub-id>, PMID: <pub-id pub-id-type="pmid">39229883</pub-id></citation></ref>
<ref id="ref54"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Quinlan</surname><given-names>A. R.</given-names></name> <name><surname>Hall</surname><given-names>I. M.</given-names></name></person-group> (<year>2010</year>). <article-title>BEDTools: a flexible suite of utilities for comparing genomic features</article-title>. <source>Bioinformatics</source> <volume>26</volume>, <fpage>841</fpage>&#x2013;<lpage>842</lpage>. doi: <pub-id pub-id-type="doi">10.1093/bioinformatics/btq033</pub-id>, PMID: <pub-id pub-id-type="pmid">20110278</pub-id></citation></ref>
<ref id="ref55"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ramaswamy</surname><given-names>S. V.</given-names></name> <name><surname>Amin</surname><given-names>A. G.</given-names></name> <name><surname>G&#x00F6;ksel</surname><given-names>S.</given-names></name> <name><surname>Stager</surname><given-names>C. E.</given-names></name> <name><surname>Dou</surname><given-names>S. J.</given-names></name> <name><surname>El Sahly</surname><given-names>H.</given-names></name> <etal/></person-group>. (<year>2000</year>). <article-title>Molecular genetic analysis of nucleotide polymorphisms associated with ethambutol resistance in human isolates of <italic>Mycobacterium tuberculosis</italic></article-title>. <source>Antimicrob. Agents Chemother.</source> <volume>44</volume>, <fpage>326</fpage>&#x2013;<lpage>336</lpage>. doi: <pub-id pub-id-type="doi">10.1128/aac.44.2.326-336.2000</pub-id>, PMID: <pub-id pub-id-type="pmid">10639358</pub-id></citation></ref>
<ref id="ref56"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sekiguchi</surname><given-names>J.</given-names></name> <name><surname>Nakamura</surname><given-names>T.</given-names></name> <name><surname>Miyoshi-Akiyama</surname><given-names>T.</given-names></name> <name><surname>Kirikae</surname><given-names>F.</given-names></name> <name><surname>Kobayashi</surname><given-names>I.</given-names></name> <name><surname>Augustynowicz-Kopec</surname><given-names>E.</given-names></name> <etal/></person-group>. (<year>2007</year>). <article-title>Development and evaluation of a line probe assay for rapid identification of <italic>pncA</italic> mutations in pyrazinamide-resistant <italic>Mycobacterium tuberculosis</italic> strains</article-title>. <source>J. Clin. Microbiol.</source> <volume>45</volume>, <fpage>2802</fpage>&#x2013;<lpage>2807</lpage>. doi: <pub-id pub-id-type="doi">10.1128/jcm.00352-07</pub-id>, PMID: <pub-id pub-id-type="pmid">17596354</pub-id></citation></ref>
<ref id="ref57"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shaku</surname><given-names>M. T.</given-names></name> <name><surname>Bishai</surname><given-names>W. R.</given-names></name></person-group> (<year>2022</year>). <article-title><italic>Mycobacterium tuberculosis</italic>: a pathogen that can hold its breath a long time</article-title>. <source>Am. J. Respir. Crit. Care Med.</source> <volume>206</volume>, <fpage>10</fpage>&#x2013;<lpage>12</lpage>. doi: <pub-id pub-id-type="doi">10.1164/rccm.202203-0432ED</pub-id>, PMID: <pub-id pub-id-type="pmid">35442854</pub-id></citation></ref>
<ref id="ref58"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shi</surname><given-names>R.</given-names></name> <name><surname>Zhang</surname><given-names>J.</given-names></name> <name><surname>Li</surname><given-names>C.</given-names></name> <name><surname>Kazumi</surname><given-names>Y.</given-names></name> <name><surname>Sugawara</surname><given-names>I.</given-names></name></person-group> (<year>2006</year>). <article-title>Emergence of ofloxacin resistance in <italic>Mycobacterium tuberculosis</italic> clinical isolates from China as determined by gyrA mutation analysis using denaturing high-pressure liquid chromatography and DNA sequencing</article-title>. <source>J. Clin. Microbiol.</source> <volume>44</volume>, <fpage>4566</fpage>&#x2013;<lpage>4568</lpage>. doi: <pub-id pub-id-type="doi">10.1128/jcm.01916-06</pub-id>, PMID: <pub-id pub-id-type="pmid">17035499</pub-id></citation></ref>
<ref id="ref59"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shitikov</surname><given-names>E.</given-names></name> <name><surname>Bespiatykh</surname><given-names>D.</given-names></name></person-group> (<year>2023</year>). <article-title>A revised SNP-based barcoding scheme for typing <italic>Mycobacterium tuberculosis</italic> complex isolates</article-title>. <source>mSphere</source> <volume>8</volume>:<fpage>e0016923</fpage>. doi: <pub-id pub-id-type="doi">10.1128/msphere.00169-23</pub-id>, PMID: <pub-id pub-id-type="pmid">37314207</pub-id></citation></ref>
<ref id="ref60"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shu</surname><given-names>W.</given-names></name> <name><surname>Liu</surname><given-names>Y. H.</given-names></name></person-group> (<year>2024</year>). <article-title>Interpretation of WHO global tuberculosis report 2023</article-title>. <source>J. Tuberc. Lung Dis.</source> <volume>5</volume>, <fpage>15</fpage>&#x2013;<lpage>19</lpage>. doi: <pub-id pub-id-type="doi">10.19983/j.issn.2096-8493.2024006</pub-id></citation></ref>
<ref id="ref61"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Singh</surname><given-names>R.</given-names></name> <name><surname>Dwivedi</surname><given-names>S. P.</given-names></name> <name><surname>Gaharwar</surname><given-names>U. S.</given-names></name> <name><surname>Meena</surname><given-names>R.</given-names></name> <name><surname>Rajamani</surname><given-names>P.</given-names></name> <name><surname>Prasad</surname><given-names>T.</given-names></name></person-group> (<year>2020</year>). <article-title>Recent updates on drug resistance in <italic>Mycobacterium tuberculosis</italic></article-title>. <source>J. Appl. Microbiol.</source> <volume>128</volume>, <fpage>1547</fpage>&#x2013;<lpage>1567</lpage>. doi: <pub-id pub-id-type="doi">10.1111/jam.14478</pub-id>, PMID: <pub-id pub-id-type="pmid">31595643</pub-id></citation></ref>
<ref id="ref62"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sreevatsan</surname><given-names>S.</given-names></name> <name><surname>Stockbauer</surname><given-names>K. E.</given-names></name> <name><surname>Pan</surname><given-names>X.</given-names></name> <name><surname>Kreiswirth</surname><given-names>B. N.</given-names></name> <name><surname>Moghazeh</surname><given-names>S. L.</given-names></name> <name><surname>Jacobs</surname><given-names>W. R.</given-names> <suffix>Jr.</suffix></name> <etal/></person-group>. (<year>1997</year>). <article-title>Ethambutol resistance in <italic>Mycobacterium tuberculosis</italic>: critical role of embB mutations</article-title>. <source>Antimicrob. Agents Chemother.</source> <volume>41</volume>, <fpage>1677</fpage>&#x2013;<lpage>1681</lpage>. doi: <pub-id pub-id-type="doi">10.1128/aac.41.8.1677</pub-id>, PMID: <pub-id pub-id-type="pmid">9257740</pub-id></citation></ref>
<ref id="ref63"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Srivastava</surname><given-names>S.</given-names></name> <name><surname>Ayyagari</surname><given-names>A.</given-names></name> <name><surname>Dhole</surname><given-names>T. N.</given-names></name> <name><surname>Nyati</surname><given-names>K. K.</given-names></name> <name><surname>Dwivedi</surname><given-names>S. K.</given-names></name></person-group> (<year>2009</year>). <article-title>emb nucleotide polymorphisms and the role of embB306 mutations in <italic>Mycobacterium tuberculosis</italic> resistance to ethambutol</article-title>. <source>Int. J. Med. Microbiol.</source> <volume>299</volume>, <fpage>269</fpage>&#x2013;<lpage>280</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.ijmm.2008.07.001</pub-id>, PMID: <pub-id pub-id-type="pmid">19010731</pub-id></citation></ref>
<ref id="ref64"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Srivastava</surname><given-names>S.</given-names></name> <name><surname>Garg</surname><given-names>A.</given-names></name> <name><surname>Ayyagari</surname><given-names>A.</given-names></name> <name><surname>Nyati</surname><given-names>K. K.</given-names></name> <name><surname>Dhole</surname><given-names>T. N.</given-names></name> <name><surname>Dwivedi</surname><given-names>S. K.</given-names></name></person-group> (<year>2006</year>). <article-title>Nucleotide polymorphism associated with ethambutol resistance in clinical isolates of <italic>Mycobacterium tuberculosis</italic></article-title>. <source>Curr. Microbiol.</source> <volume>53</volume>, <fpage>401</fpage>&#x2013;<lpage>405</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s00284-006-0135-1</pub-id>, PMID: <pub-id pub-id-type="pmid">16972132</pub-id></citation></ref>
<ref id="ref65"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tonkin-Hill</surname><given-names>G.</given-names></name> <name><surname>MacAlasdair</surname><given-names>N.</given-names></name> <name><surname>Ruis</surname><given-names>C.</given-names></name> <name><surname>Weimann</surname><given-names>A.</given-names></name> <name><surname>Horesh</surname><given-names>G.</given-names></name> <name><surname>Lees</surname><given-names>J. A.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>Producing polished prokaryotic pangenomes with the Panaroo pipeline</article-title>. <source>Genome Biol.</source> <volume>21</volume>:<fpage>180</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s13059-020-02090-4</pub-id>, PMID: <pub-id pub-id-type="pmid">32698896</pub-id></citation></ref>
<ref id="ref66"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Van der Auwera</surname><given-names>G. A.</given-names></name> <name><surname>Carneiro</surname><given-names>M. O.</given-names></name> <name><surname>Hartl</surname><given-names>C.</given-names></name> <name><surname>Poplin</surname><given-names>R.</given-names></name> <name><surname>Del Angel</surname><given-names>G.</given-names></name> <name><surname>Levy-Moonshine</surname><given-names>A.</given-names></name> <etal/></person-group>. (<year>2013</year>). <article-title>From fastQ data to high confidence variant calls: the genome analysis toolkit best practices pipeline</article-title>. <source>Curr. Protoc. Bioinform.</source> <volume>43</volume>, <fpage>11.10.11</fpage>&#x2013;<lpage>11.10.33</lpage>. doi: <pub-id pub-id-type="doi">10.1002/0471250953.bi1110s43</pub-id></citation></ref>
<ref id="ref67"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Willby</surname><given-names>M. J.</given-names></name> <name><surname>Wijkander</surname><given-names>M.</given-names></name> <name><surname>Havumaki</surname><given-names>J.</given-names></name> <name><surname>Johnson</surname><given-names>K.</given-names></name> <name><surname>Werngren</surname><given-names>J.</given-names></name> <name><surname>Hoffner</surname><given-names>S.</given-names></name> <etal/></person-group>. (<year>2018</year>). <article-title>Detection of <italic>Mycobacterium tuberculosis</italic> pncA mutations by the Nipro Genoscholar PZA-TB II assay compared to conventional sequencing</article-title>. <source>Antimicrob. Agents Chemother.</source> <volume>62</volume>:<fpage>e01871-17</fpage>. doi: <pub-id pub-id-type="doi">10.1128/aac.01871-17</pub-id>, PMID: <pub-id pub-id-type="pmid">29084743</pub-id></citation></ref>
<ref id="ref68"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wulandari</surname><given-names>D. A.</given-names></name> <name><surname>Hartati</surname><given-names>Y. W.</given-names></name> <name><surname>Ibrahim</surname><given-names>A. U.</given-names></name> <name><surname>Pitaloka</surname><given-names>D. A. E.</given-names></name> <name><surname>Irkham</surname></name></person-group> (<year>2024</year>). <article-title>Multidrug-resistant tuberculosis</article-title>. <source>Clin. Chim. Acta</source> <volume>559</volume>:<fpage>119701</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.cca.2024.119701</pub-id></citation></ref>
<ref id="ref69"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname><given-names>Z.</given-names></name></person-group> (<year>2022</year>). <article-title><italic>K</italic><sub>a</sub><italic>K</italic><sub>s</sub>_Calculator 3.0: calculating selective pressure on coding and non-coding sequences</article-title>. <source>Genomics Proteomics Bioinformatics</source> <volume>20</volume>, <fpage>536</fpage>&#x2013;<lpage>540</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.gpb.2021.12.002</pub-id>, PMID: <pub-id pub-id-type="pmid">34990803</pub-id></citation></ref>
<ref id="ref70"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname><given-names>D.</given-names></name> <name><surname>Gao</surname><given-names>F.</given-names></name> <name><surname>Jakovli&#x0107;</surname><given-names>I.</given-names></name> <name><surname>Zou</surname><given-names>H.</given-names></name> <name><surname>Zhang</surname><given-names>J.</given-names></name> <name><surname>Li</surname><given-names>W. X.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>PhyloSuite: an integrated and scalable desktop platform for streamlined molecular sequence data management and evolutionary phylogenetics studies</article-title>. <source>Mol. Ecol. Resour.</source> <volume>20</volume>, <fpage>348</fpage>&#x2013;<lpage>355</lpage>. doi: <pub-id pub-id-type="doi">10.1111/1755-0998.13096</pub-id>, PMID: <pub-id pub-id-type="pmid">31599058</pub-id></citation></ref>
<ref id="ref71"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname><given-names>Z.</given-names></name> <name><surname>Xiao</surname><given-names>J.</given-names></name> <name><surname>Wu</surname><given-names>J.</given-names></name> <name><surname>Zhang</surname><given-names>H.</given-names></name> <name><surname>Liu</surname><given-names>G.</given-names></name> <name><surname>Wang</surname><given-names>X.</given-names></name> <etal/></person-group>. (<year>2012</year>). <article-title>ParaAT: a parallel tool for constructing multiple protein-coding DNA alignments</article-title>. <source>Biochem. Biophys. Res. Commun.</source> <volume>419</volume>, <fpage>779</fpage>&#x2013;<lpage>781</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.bbrc.2012.02.101</pub-id>, PMID: <pub-id pub-id-type="pmid">22390928</pub-id></citation></ref>
</ref-list>
</back>
</article>