<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Microbiol.</journal-id>
<journal-title>Frontiers in Microbiology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Microbiol.</abbrev-journal-title>
<issn pub-type="epub">1664-302X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fmicb.2025.1537826</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Microbiology</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Benchmarking pangenome dynamics and horizontal gene transfer in <italic>Mycobacterium marinum</italic> evolution</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" equal-contrib="yes">
<name><surname>Shahed</surname> <given-names>Khandker</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="author-notes" rid="fn002"><sup>&#x2020;</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author" corresp="yes" equal-contrib="yes">
<name><surname>Islam</surname> <given-names>Sk Injamamul</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="corresp" rid="c002"><sup>&#x002A;</sup></xref>
<xref ref-type="author-notes" rid="fn002"><sup>&#x2020;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/2284497/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Sangsawad</surname> <given-names>Papungkorn</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Jung</surname> <given-names>Won-Kyo</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Permpoonpattana</surname> <given-names>Patima</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x002A;</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Linh</surname> <given-names>Nguyen Vu</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<xref ref-type="corresp" rid="c003"><sup>&#x002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1729457/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>BioMac Lab</institution>, <addr-line>Dhaka</addr-line>, <country>Bangladesh</country></aff>
<aff id="aff2"><sup>2</sup><institution>School of Animal Technology and Innovation, Institute of Agricultural Technology, Suranaree University of Technology</institution>, <addr-line>Nakhon Ratchasima</addr-line>, <country>Thailand</country></aff>
<aff id="aff3"><sup>3</sup><institution>Department of Agricultural Science and Technology, Faculty of Innovative Agriculture, Fisheries and Food, Prince of Songkla University, Surat Thani Campus</institution>, <addr-line>Surat Thani</addr-line>, <country>Thailand</country></aff>
<aff id="aff4"><sup>4</sup><institution>Department of Animal and Aquatic Sciences, Faculty of Agriculture, Chiang Mai University</institution>, <addr-line>Chiang Mai</addr-line>, <country>Thailand</country></aff>
<author-notes>
<fn fn-type="edited-by"><p>Edited by: Svetlana Khaiboullina, University of Nevada, Reno, United States</p></fn>
<fn fn-type="edited-by"><p>Reviewed by: James T. Tambong, Agriculture and Agri-Food Canada (AAFC), Canada</p><p>Ketan Patel, Centers for Disease Control and Prevention (CDC), United States</p></fn>
<corresp id="c001">&#x002A;Correspondence: Patima Permpoonpattana, <email>patima.pe@psu.ac.th</email></corresp>
<corresp id="c002">Sk Injamamul Islam, <email>injamamulislam017@gmail.com</email></corresp>
<corresp id="c003">Nguyen Vu Linh, <email>linhvu.n@cmu.ac.th</email></corresp>
<fn fn-type="equal" id="fn002"><p><sup>&#x2020;</sup>These authors share first authorship</p></fn>
</author-notes>
<pub-date pub-type="epub">
<day>17</day>
<month>06</month>
<year>2025</year>
</pub-date>
<pub-date pub-type="collection">
<year>2025</year>
</pub-date>
<volume>16</volume>
<elocation-id>1537826</elocation-id>
<history>
<date date-type="received">
<day>01</day>
<month>12</month>
<year>2024</year>
</date>
<date date-type="accepted">
<day>20</day>
<month>05</month>
<year>2025</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2025 Shahed, Islam, Sangsawad, Jung, Permpoonpattana and Linh.</copyright-statement>
<copyright-year>2025</copyright-year>
<copyright-holder>Shahed, Islam, Sangsawad, Jung, Permpoonpattana and Linh</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<abstract>
<p>Horizontal gene transfer (HGT) is a key driver of microbial evolution, promoting genetic diversity and contributing to the emergence of antibiotic resistance. This study explores the pangenome dynamics and HGT in <italic>Mycobacterium marinum</italic> (<italic>M. marinum</italic>), a close relative of <italic>Mycobacterium tuberculosis</italic>. Multiple pangenome datasets were analyzed to quantify gene gain, loss, and pangenome openness, utilizing Panstripe and a Generalized Linear Model (GLM) framework to assess gene presence/absence across strains. Additionally, a comparative benchmarking analysis of gene ontology (GO) annotations were conducted using eggNOG and InterProScan to evaluate their functional annotation accuracy. Our findings demonstrated significant differences in gene gain and loss rates, suggesting variations in annotation accuracy and the presence of mobile genetic elements (MGE). Single nucleotide polymorphisms (SNPs) were also identified, highlighting the genetic variability that may impact strain-specific traits such as pathogenicity and antibiotic resistance. Pangenome of <italic>M. marinum</italic> was characterized as highly open, with substantial variability in gene content, reflecting ongoing genetic exchange and adaptability. Functional annotation benchmarking demonstrated that eggNOG and InterProScan provided complementary insights, with each tool excelling in distinct strengths of gene function identification. Overall, these findings highlight the complex interplay between HGT, pangenome evolution, and antibiotic resistance in <italic>M. marinum</italic>, and the analytical framework presented here provides a robust approach for future studies aiming to inform therapeutic interventions and vaccine development.</p>
</abstract>
<kwd-group>
<kwd>benchmark</kwd>
<kwd>pathogens</kwd>
<kwd>genome</kwd>
<kwd>alternatives to antibiotic</kwd>
<kwd>SNPs</kwd>
</kwd-group>
<counts>
<fig-count count="7"/>
<table-count count="1"/>
<equation-count count="0"/>
<ref-count count="70"/>
<page-count count="13"/>
<word-count count="8198"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Aquatic Microbiology</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="S1" sec-type="intro">
<title>1 Introduction</title>
<p><italic>Mycobacterium marinum</italic> causes tuberculosis-like disease in poikilothermic animals and acts as an opportunistic pathogen in humans, typically manifesting as localized skin infections due to its temperature-dependent growth restriction (<xref ref-type="bibr" rid="B46">Ramakrishnan and Falkow, 1994</xref>). Unlike <italic>Mycobacterium tuberculosis</italic>, which has adapted specifically to humans, <italic>M. marinum</italic> retains a generalist ecological strategy, infecting diverse animal hosts and protozoa. Despite its larger genome, <italic>M. marinum</italic> shares close phylogenetic ties with <italic>M. tuberculosis</italic>, and exhibits striking similarities in cellular infection mechanisms (<xref ref-type="bibr" rid="B9">Cardenal-Mu&#x00F1;oz et al., 2018</xref>; <xref ref-type="bibr" rid="B54">Stinear et al., 2008</xref>). Originally misclassified as <italic>M. piscium</italic> due to its association with marine fish, <italic>M. marinum</italic> is now recognized as a globally distributed pathogen (<xref ref-type="bibr" rid="B4">Aubry et al., 2017</xref>). It thrives in diverse aquatic environment&#x2014;saltwater, brackish systems, and both stagnant and flowing freshwater&#x2014;infecting over 150 fish, frog, eel and oyster species (<xref ref-type="bibr" rid="B2">Aronson, 1926</xref>; <xref ref-type="bibr" rid="B6">Beecham et al., 1991</xref>). Human infections are generally cutaneous, though immunocompromised individuals may experience deeper tissue invasion or systemic spread (<xref ref-type="bibr" rid="B62">Tsiolakkis et al., 2023</xref>). Scientific interest in <italic>M. marinum</italic> stems from its genetic similarity to <italic>M. tuberculosis</italic> and its utility in modeling tuberculosis pathogenesis using goldfish (<italic>Carassius auratus</italic>) (<xref ref-type="bibr" rid="B50">Ruley et al., 2004</xref>). Recent attention has intensified due to parallels with <italic>M. ulcerans</italic> infections and the growing popularity of aquarium-related activities. which may elevate clinical case rates (<xref ref-type="bibr" rid="B4">Aubry et al., 2017</xref>).</p>
<p>Pathogenetically, <italic>M. marinum</italic> and <italic>M. ulcerans</italic> from a distinct pathogenic clade within non-tuberculous mycobacteria (NTM) (<xref ref-type="bibr" rid="B66">Wolinsky, 1992</xref>), sharing &#x003E; 98% nucleotide identity with <italic>M. ulcerans</italic> in key biomarkers, including <italic>16S rRNA</italic>, <italic>rpoB</italic>, <italic>gyrA/B</italic>, and <italic>hsp65</italic> (<xref ref-type="bibr" rid="B12">Dauendorffer et al., 2003</xref>; <xref ref-type="bibr" rid="B53">Stinear et al., 2000</xref>; <xref ref-type="bibr" rid="B54">Stinear et al., 2008</xref>). Early genomic comparisons of <italic>M. marinum</italic> strains (MB2, Europe, and the human-derived M strain) suggested highly similarity (<xref ref-type="bibr" rid="B32">Kurokawa et al., 2013</xref>), but expanded analyses of 15 human- and fish-derived isolates revealed unexpected genomic diversity (<xref ref-type="bibr" rid="B11">Das et al., 2018</xref>). Divergence primarily affects lipid metabolism, virulence factors, stress response pathways, underscoring the need for complete genome-based comparisons to resolve strain-specific adaptations (<xref ref-type="bibr" rid="B65">Vasudevan et al., 2020</xref>). DNA-DNA hybridization and mycolic acid profiling further confirm <italic>M. marinum</italic> and <italic>M. ulcerans</italic> as the closest relatives of <italic>M. tuberculosis</italic> (<xref ref-type="bibr" rid="B49">Rogall et al., 1990</xref>; <xref ref-type="bibr" rid="B58">T&#x00F8;njum et al., 1998</xref>).</p>
<p>Advances in whole-genome sequencing have revolutionized bacterial phylogenetics, enabling precise strain typing, antibiotic resistance profiling, and outbreak surveillance (<xref ref-type="bibr" rid="B1">Abdella et al., 2023</xref>; <xref ref-type="bibr" rid="B29">Jin et al., 2020</xref>; <xref ref-type="bibr" rid="B41">P&#x00E9;rez-Pascual et al., 2017</xref>). While prior studies explored <italic>M. marinum</italic>&#x2019;s genetic relationships (<xref ref-type="bibr" rid="B11">Das et al., 2018</xref>; <xref ref-type="bibr" rid="B32">Kurokawa et al., 2013</xref>), critical gaps remain in linking genomic diversity to atypical virulence factors and antimicrobial resistance (AMR). The growing availability of complete genomes now permits robust pangenome analyses, which are essential for distinguishing core and accessory genes, identifying SNPs/indels, and resolving taxonomic ambiguities (<xref ref-type="bibr" rid="B47">Reis and Cunha, 2021</xref>). Such approaches also address the limitations of traditional biomarkers, which often fail to capture taxonomy relationships across bacterial serotypes.</p>
<p>Horizontal gene transfer (HTG)&#x2014;a primary driver of virulence and AMR genes acquisition&#x2014;further complicates <italic>M. marinum</italic>&#x2019;s genomic landscape (<xref ref-type="bibr" rid="B37">Mahmoud et al., 2022</xref>). To clarify these dynamics, a comparative genomics on eight complete genomes of <italic>M. marinum</italic> was performed. Subsequently, the pangenome and core genome were defined, and the average nucleotide identity (ANI) was calculated. The pangenome gain and loss rate was also analyzed. Collectively, this study would provide insights into the genomic features of the species and reveal highly conserved virulence genes along with their associations with antimicrobial drug resistance.</p>
</sec>
<sec id="S2" sec-type="materials|methods">
<title>2 Materials and methods</title>
<sec id="S2.SS1">
<title>2.1 <italic>Mycobacterium marinum</italic> dataset selection and quality assessment</title>
<p>A total of 100 distinct <italic>M. marinum</italic> genome sequences (including contigs, scaffolds, chromosomes, and complete sequences) are currently available in the NCBI genome database. On September 12, 2024, 8 complete genomes of <italic>M. marinum</italic> were downloaded. To further refine the data, the CheckM program (version 1.2.1) (<xref ref-type="bibr" rid="B40">Parks et al., 2022</xref>) was employed for genome quality filtration. The criteria for genome completeness were set at a minimum of 90%, while the maximum allowed contamination was 5%. Recent studies have emphasized the importance of selecting a high-quality and appropriate dataset for pangenome research (<xref ref-type="bibr" rid="B68">Wu et al., 2021</xref>; <xref ref-type="bibr" rid="B69">Wu et al., 2022</xref>). This careful selection ensures the reliability of downstream analyses, leading to more robust insights into pangenome and potential SNPs within the species. <xref ref-type="supplementary-material" rid="TS1">Supplementary Table 1</xref> presents genome assembly, accession numbers, and genomic information, including genome size, gene count, and protein-coding genes. Only whole genomes were analyzed to ensure the most accurate representation of strain virulence genes and potential identifying biomarkers.</p>
</sec>
<sec id="S2.SS2">
<title>2.2 Average nucleotide identity</title>
<p>To verify species relationships, we performed nucleotide-level comparisons of all potential genome combinations using the ANI approach. The Python script PyANI v0.2.722 was used to compute pairwise ANI values using two different methods, the MUMmer (<xref ref-type="bibr" rid="B33">Kurtz et al., 2004</xref>) and the BLAST + method (<xref ref-type="bibr" rid="B7">Camacho et al., 2009</xref>) employing the ANIm and ANIb options, respectively. All strains classified as <italic>M. marinum</italic> were chosen for further analysis, while those misidentified were discarded. This decision was based on setting a threshold value indicating that the ANI of the same species exceeds 94% (<xref ref-type="bibr" rid="B23">Goris et al., 2007</xref>; <xref ref-type="bibr" rid="B48">Richter and Rossell&#x00F3;-M&#x00F3;ra, 2009</xref>).</p>
</sec>
<sec id="S2.SS3">
<title>2.3 Building pangenome</title>
<p>To maintain consistency and standardization, the genomes of the <italic>M. marinum</italic> strains examined were re-annotated for their functional attributes using the Prokka suite version 1.14.6 (<xref ref-type="bibr" rid="B43">Podrzaj et al., 2022</xref>). The software Roary (<xref ref-type="bibr" rid="B39">Page et al., 2015</xref>) and Panaroo (<xref ref-type="bibr" rid="B60">Tonkin-Hill et al., 2020</xref>) with a default identity threshold of 95%, was employed to construct the core and pan-genome of <italic>M. marinum</italic>. Briefly, genes have been categorized into four distinct groups: core genes, present in more than 99% of genomes; softcore genes, found in most strains, specifically in over 95% but fewer than 99%; shell genes, identified in 15% to less than 95% of the strains; and cloud genes, which are observed in fewer than 15% of the total strains. In addition, the pangenome was analyzed using Heap&#x2019;s Law (<xref ref-type="bibr" rid="B45">Rajput et al., 2023</xref>) and Power Law fit (<xref ref-type="bibr" rid="B56">Tettelin et al., 2005</xref>) in conjunction with the custom script<sup><xref ref-type="fn" rid="footnote1">1</xref></sup> and the &#x201C;ggcaller v1.3.0&#x201D; in Python programing (<xref ref-type="bibr" rid="B24">Horsfield et al., 2023</xref>), respectively. This approach allowed for the calculation of constant variables and the application of the least squares method to fit an exponential regression decay model to both the core genome and singletons. Heap&#x2019;s Law was used to determine the fixed parameters from the pangenome with the formula n = &#x03BA;N<sup>&#x03B3;</sup>, where n represents the number of pangenome genes and N is the number of genomes, least-squares fit is represented by the equation n = k &#x00D7; exp [-x/t] + tg&#x03B8;, where n is the number of genes, and k, t, and tg&#x03B8; are independent variables (<xref ref-type="bibr" rid="B27">Islam et al., 2025</xref>; <xref ref-type="bibr" rid="B38">Mwamburi et al., 2024</xref>). This algorithm is utilized to ascertain the number of genes that will compose the core genome upon stabilization (<xref ref-type="bibr" rid="B52">Soares et al., 2013</xref>) and to offer an approximate calculation of the genes contributed by each freshly sequenced genome. Additionally, the complete pangenome for the entire dataset of genomes was generated using anvi&#x2019;o v8 (<xref ref-type="bibr" rid="B17">Eren et al., 2015</xref>), followed by the pangenomics procedure described in this guide: <ext-link ext-link-type="uri" xlink:href="https://merenlab.org/2016/11/08/pangenomics-v2/2/">https://merenlab.org/2016/11/08/pangenomics-v2/2/</ext-link>. In brief, the following scripts were executed: anvi-gen-contigs-database, utilized to create a database, with Prodigal v2.6.3 (<xref ref-type="bibr" rid="B26">Hyatt et al., 2010</xref>) for identifying open reading frames in contigs, and anvi-run-ncbi-cogs, which provided gene annotations by utilizing NCBI Clusters of Orthologous Groups database (<xref ref-type="bibr" rid="B55">Tatusov et al., 2000</xref>). The genome database was created using anvi-gen-genomes-storage and anvil-pan-genome for visualization. Anvi&#x2019;o employs the DIAMOND tool to compute the similarity between each amino acid sequence in every genome and all other amino acid sequences across all genomes in the dataset and then uses the MCL algorithm (<xref ref-type="bibr" rid="B64">van Dongen and Abreu-Goodger, 2012</xref>) to detect clusters in the results of amino acid sequence similarity.</p>
</sec>
<sec id="S2.SS4">
<title>2.4 Genome synteny and SNPs identification</title>
<p>Gene synteny analysis was performed using the Mauve program version snapshot_2015_02_13 (<xref ref-type="bibr" rid="B16">Edwards and Holt, 2013</xref>) and its progressive Mauve algorithm to detect potential gene rearrangement events. The software segmented the genomes into predefined fragments and used this information to perform numerous genome alignments. These alignments identified local collinear blocks (LCB) which were then visualized in a figure. This figure serves as a tool to identify and analyze rearrangements within the genomes. Subsequently, a customized Python script called msa2snp.py<sup><xref ref-type="fn" rid="footnote2">2</xref></sup> was employed to detect all SNPs within the target genes. The results of SNP identification were manually curated to identify the most informative SNP, found exclusively in all <italic>M. marinum</italic> complete genomes.</p>
</sec>
<sec id="S2.SS5">
<title>2.5 Functional annotation and identification of gene encoders</title>
<p>BLAST searches were performed for all protein-coding genes in the National Centre for Biotechnology Information (NCBI) database, which was accessed at <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/on">https://www.ncbi.nlm.nih.gov/on</ext-link> 20.09.2024. The entire genome, including repetitive elements, was annotated using eggNOG-mapper v2 (<xref ref-type="bibr" rid="B8">Cantalapiedra et al., 2021</xref>) and InterProScan (<xref ref-type="bibr" rid="B44">Quevillon et al., 2005</xref>) in a Linux environment. The sequence alignment process entailed mapping each sequence with either the hidden Markov model (HMM) or DIAMOND to match it with the eggNOG database. The ideal matching sequence of the target sequence is classified according to its taxonomy and further categorized and annotated utilizing gene ontology (GO) (<xref ref-type="bibr" rid="B22">Gene Ontology Consortium, 2015</xref>) and Kyoto Encyclopedia of Genes and Genomes (KEGG) pathways (<xref ref-type="bibr" rid="B31">Kanehisa et al., 2017</xref>) through the application of the clusterProfiler v.3.19 package in R (<xref ref-type="bibr" rid="B70">Xu et al., 2024</xref>). Furthermore, BLAST analysis was performed to examine the 80 genomes for the presence of genes linked to virulence and pathogenicity. We employed BLASTN via ABRicate v1.0.1<sup><xref ref-type="fn" rid="footnote3">3</xref></sup> (<xref ref-type="bibr" rid="B13">de Man and Limbago, 2016</xref>) and the Virulence Factor Database (VFDB) (<xref ref-type="bibr" rid="B36">Liu et al., 2022</xref>) to examine the occurrence of virulence factors and antibiotic resistance gene in all strains of <italic>M. marinum</italic>. The analysis was performed using a 90% identity threshold and a 30% coverage threshold.</p>
</sec>
<sec id="S2.SS6">
<title>2.6 Region of genomic plasticity</title>
<p>To investigate the RGP in eight complete genomes of <italic>M. marinum</italic>, PPanGGOLiN software<sup><xref ref-type="fn" rid="footnote4">4</xref></sup> (<xref ref-type="bibr" rid="B20">Gautreau et al., 2020</xref>) was utilized with &#x201C;panrgp&#x201D; command. Genomic plasticity regions, which include genomic islands, prophages, and other variable elements, were identified using PPanGGOLiN&#x2019;s comprehensive pangenome analysis capabilities. Initially, the genomes were prepared and formatted according to requirements based on the sample input dataset of the software. PPanGGOLiN was then employed to perform a detailed analysis, identifying regions of genomic variability and plasticity across the <italic>M. marinum</italic> strains. The tool provided insights into the distribution and composition of these plastic regions, allowing to map and characterize their presence and variability among the genomes. This analysis revealed the dynamic regions contributing to the genomic diversity and adaptability of <italic>M. marinum</italic>.</p>
</sec>
<sec id="S2.SS7">
<title>2.7 Pangenome gain and loss rate analysis</title>
<p>Horizontal gene transfer is a vital factor in the evolution and diversification of numerous microbial species. The ensuing dynamics of gene acquisition and loss can significantly impact the emergence of antibiotic resistance and influence the development of vaccines and therapeutic interventions (<xref ref-type="bibr" rid="B59">Tonkin-Hill et al., 2023</xref>). Panstripe<sup><xref ref-type="fn" rid="footnote5">5</xref></sup> improves the post-processing of bacterial pangenome analyses (<xref ref-type="bibr" rid="B59">Tonkin-Hill et al., 2023</xref>). Panstripe accepts a phylogeny and a gene presence/absence matrix in Rtab format, which can be generated by tools like Panaroo and Roary. Utilizing a Generalized Linear Model (GLM) framework allows for straightforward comparison of slope terms across different datasets. The &#x201C;compare_pangenomes&#x201D; function analyzes the interaction term between the datasets alongside the core, tip, and depth terms. A significant <italic>p</italic>-value for the tip term indicates that the two pangenomes differ in the rates of gene presence and absence observed at the tips of the phylogeny. This variation is often attributed to differences in annotation error rates between datasets or to fluctuations in the gain and loss of highly mobile genetic elements that may not persist long enough to be detected across multiple genomes. A significant <italic>p</italic>-value for the core term suggests differing rates of gene gain and loss between the two datasets. Although the depth term is less critical, it reflects discrepancies in the ability to detect older gene exchange events between the two pangenomes. The dispersion parameter reveals whether there is a notable difference in the dispersion of the two pangenomes, implying that the relationship between gene exchange rates and the size of each event varies between the two datasets. The <italic>p</italic>-value is derived using a Likelihood Ratio Test, and a subset of inferred GLM parameters can be analyzed. The resulting p-values and bootstrap confidence intervals can help assess the significance of each term in the model to gene gain and loss (<xref ref-type="bibr" rid="B59">Tonkin-Hill et al., 2023</xref>).</p>
</sec>
<sec id="S2.SS8">
<title>2.8 Egg-NOG-mapper vs. InterProScan</title>
<p>In this benchmarking analysis, we compared the annotation performance of EggNOG-mapper and InterProScan for <italic>M. marinum</italic>, focusing on metrics such as GO term accuracy, average GO terms per protein, and proteome coverage (<xref ref-type="bibr" rid="B25">Huerta-Cepas et al., 2017</xref>). Annotation files generated by each tool were parsed using the pandas library in Python v3.8, extracting relevant data such as GO terms and Pfam domains. The data were structured into a standardized format, capturing sets of GO terms, functional categories, and proteome coverage for both tools. To evaluate the performance of each tool, key metrics were calculated. These included the proportions of true positive (TP) and false positive (FP) annotations, which were used to assess the accuracy of GO term predictions. Additionally, the average number of GO terms per protein was computed to reflect the specificity of the annotations. Finally, proteome coverage was evaluated based on the proportion of proteins that were annotated with only TP terms, a mix of TP and FP terms, or no TP terms. This analysis provides a comparative framework for assessing annotation quality, highlighting the strengths and limitations of each tool&#x2019;s functional annotation capabilities for genomic studies.</p>
</sec>
</sec>
<sec id="S3" sec-type="results">
<title>3 Results</title>
<sec id="S3.SS1">
<title>3.1 Genomic features and ANI</title>
<p>The genomic features are represented in <xref ref-type="supplementary-material" rid="TS1">Supplementary Table 1</xref>, which lists the assembly accessions, organism infraspecific names, assembly release dates, number of scaffolds, and isolated species for eight complete genomes of <italic>M. marinum</italic>. Genetic variability between the fish isolates, such as E11, CCUG20998, and 1218R, and the human isolates, including H01, MMA1, and <italic>Mycobacterium</italic>, is minimal according to the ANI analysis (<xref ref-type="fig" rid="F1">Figure 1</xref>). The heatmap shows that the ANI percentages are consistently high, nearing or above 98%, indicating close genetic relatedness between strains from fish and human sources. This suggests that despite the different host origins, these <italic>M. marinum</italic> strains share significant genomic similarity.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption><p>The pairwise average nucleotide identity (ANI) values for the eight complete <italic>M. marinum</italic> genomes are represented in this heat map, with distinct strains differentiated by color coding along the <italic>x</italic>- and <italic>y</italic>-axes. High similarity, indicated by the color red, suggests that the organisms belong to the same species.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmicb-16-1537826-g001.tif"/>
</fig>
</sec>
<sec id="S3.SS2">
<title>3.2 Pangenome and core genome</title>
<p>Pangenome analysis of <italic>M. marinum</italic> based on the eight complete genome sequences reveals a large proportion of core genes and significant genomic diversity. The gene presence-absence matrix (<xref ref-type="supplementary-material" rid="FS1">Supplementary Figure 1</xref>) showed a clear clustering of strains, with the core genome represented by 4634 gene clusters (<xref ref-type="supplementary-material" rid="FS1">Supplementary Figure 2</xref>). This suggests that a substantial fraction of genes is conserved across all strains, indicating evolutionary stability in essential functions. Additionally, the shell genome comprises 1390 gene clusters, reflecting moderate variability among strains. No soft-core genes were detected, while 1758 gene clusters belong to the cloud genome, representing strain-specific genes. These cloud genes highlight the presence of unique, possibly adaptive, traits linked to the strain&#x2019;s environmental or host-specific pressures.</p>
<p><xref ref-type="fig" rid="F2">Figure 2</xref> displays a circular representation of the core genome and pan-genome of <italic>M. marinum</italic>. The outermost circle represents the core genome, which is shared by all strains. The inner circles represent the pan-genome, which consists of genes that are present in at least one strain. The pangenome analysis reveals that the core genome of <italic>M. marinum</italic> is relatively small, suggesting that the species has a high degree of genetic diversity. The presence of many singleton genes in each strain suggests that <italic>M. marinum</italic> is rapidly evolving and adapting to different environments.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption><p>The visualization of the pangenome of <italic>M. marinum</italic> was conducted by performing Anvio, which incorporated a total of eight complete genomes. The dendrogram shows the phylogenetic relationship between the strains. The bars on the right of the dendrogram represent the number of singleton genes in each strain. The bar graph below the dendrogram shows the GC content of each strain.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmicb-16-1537826-g002.tif"/>
</fig>
<p><xref ref-type="fig" rid="F3">Figure 3</xref> illustrates the open nature of the pangenome using different fitting models. A power-law fit to depict the cumulative number of genes discovered as more genomes are sampled (<xref ref-type="fig" rid="F3">Figure 3A</xref>). The steady slope in the fitted curve indicates continuous gene discovery, confirming that the pangenome remains open, as suggested by the equation y = 0.0917x + 0.0012y. Heap&#x2019;s law (<xref ref-type="fig" rid="F3">Figure 3B</xref>) shows the number of unique genes discovered with increasing genome samples and further reinforces the open pangenome model, as new unique genes continue to emerge with additional genome sampling.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption><p><bold>(A)</bold> The rarefaction curve illustrates the quantity of newly identified genes resulting from random additions to a single genome. The power-law fit equation is represented by &#x03B3; = 0.0917 &#x00B1; 0.0012. <bold>(B)</bold> Heap&#x2019;s Law plot illustrates the relationship between the number of genomes sampled and the number of unique genes identified in <italic>M. marinum</italic>. The fitted curve (red line) follows Heap&#x2019;s Law, with parameters k = 5427.124.76 and &#x03B3; = 0.169, indicating an open pangenome, where the number of unique genes increases as more genomes are sampled.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmicb-16-1537826-g003.tif"/>
</fig>
</sec>
<sec id="S3.SS3">
<title>3.3 Genome synteny analysis and biomarker identification</title>
<p>The Mauve software was utilized to create a visual representation of gene synteny across the genomic sequences of various <italic>M. marinum</italic> strains, allowing for the identification of potential genetic rearrangements based on sequence similarity (<xref ref-type="supplementary-material" rid="FS1">Supplementary Figure 3</xref>). The presence of gene blocks facilitated the detection of synteny, enabling the accurate identification of these regions. A comparative analysis of the genomes revealed several fragmented areas, characterized by multiple inversions and deletions. Notably, despite these disruptions, a high degree of uniformity was observed, with large, conserved segments exhibiting inversions and deletions when compared across the genomes.</p>
</sec>
<sec id="S3.SS4">
<title>3.4 Encoding genomic features</title>
<p>The Gene Ontology (GO) enrichment (<xref ref-type="fig" rid="F4">Figure 4</xref>) and KEGG pathway analysis (<xref ref-type="fig" rid="F5">Figure 5</xref>) of the <italic>M. marinum</italic> pangenome annotation, conducted through eggNOG and InterProScan, provide a comprehensive overview of the functional capabilities of the genes identified. The GO enrichment analysis reveals that biological processes like positive regulation of RNA biosynthetic processes, DNA-templated transcription, carbohydrate derivative biosynthesis, mitochondrial function, and cell adhesion are highly significant. These processes underscore key roles in cellular organization, metabolic activity, biosynthesis, and cell signaling. The negative regulation of nucleobase-containing compound metabolism and RNA metabolic processes also suggests intricate regulatory mechanisms at play in gene expression and metabolic control.</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption><p>Gene Ontology (GO) enrichment analysis from the <italic>M. marinum</italic> pangenome annotation showing key biological processes.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmicb-16-1537826-g004.tif"/>
</fig>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption><p>KEGG pathway enrichment analysis for the <italic>M. marinum</italic> pangenome annotation using eggNOG and InterProScan.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmicb-16-1537826-g005.tif"/>
</fig>
<p>The KEGG pathway analysis highlights critical pathways including the PI3K-Akt and MAPK signaling pathways, both essential for cell survival, growth, and immune responses. Other enriched pathways like neuroactive ligand-receptor interaction, cytokine-cytokine receptor interaction, and calcium signaling pathways point to significant communication and signaling mechanisms that might play a role in host-pathogen interactions.</p>
<p>The virulence factor analysis of all the complete genomes identified several key virulence genes, highlighting important duplications: <italic>esxB, fbpC, fbpB, esxG, esxH, eccA3, eccC3, esxM, esxA, ideR, relA, hbhA, phoP</italic>, and <italic>mbtH</italic> (<xref ref-type="table" rid="T1">Table 1</xref>). Notably, the duplication of <italic>fbpB</italic> and <italic>fbpC</italic>, both associated with mycolyl transferase activity, suggests functional redundancy in adherence mechanisms. Additionally, the presence of multiple components of the Type VII secretion system, including <italic>esxB, esxG, esxH, eccA3</italic>, and <italic>eccC3</italic>, underscores the significance of this system in the virulence of <italic>M. marinum.</italic></p>
<table-wrap position="float" id="T1">
<label>TABLE 1</label>
<caption><p>Functional category of virulence genes in <italic>M. marinum</italic> pangenome.</p></caption>
<table cellspacing="5" cellpadding="5" frame="box" rules="all">
<thead>
<tr>
<td valign="top" align="left" style="color:#ffffff;background-color: #7f8080;">Gene functional category</td>
<td valign="top" align="left" style="color:#ffffff;background-color: #7f8080;">Virulence gene</td>
<td valign="top" align="left" style="color:#ffffff;background-color: #7f8080;">Product</td>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Effector delivery system</td>
<td valign="top" align="left"><italic>esxB</italic></td>
<td valign="top" align="left">10 kDa culture filtrate antigen EsxB (CFP-10)</td>
</tr>
<tr>
<td valign="top" align="left">Adherence</td>
<td valign="top" align="left"><italic>fbpC</italic></td>
<td valign="top" align="left">Secreted antigen 85-C FbpC (85C) (antigen 85 complex C) (AG58C) (mycolyl transferase 85C) (fibronectin-binding protein C)</td>
</tr>
<tr>
<td valign="top" align="left">Effector delivery system</td>
<td valign="top" align="left"><italic>eccA3</italic></td>
<td valign="top" align="left">Type VII secretion system protein EccA3</td>
</tr>
<tr>
<td valign="top" align="left">Effector delivery system</td>
<td valign="top" align="left"><italic>eccC3</italic></td>
<td valign="top" align="left">Type VII secretion system protein EccC3</td>
</tr>
<tr>
<td valign="top" align="left">Effector delivery system</td>
<td valign="top" align="left"><italic>PE5</italic></td>
<td valign="top" align="left">PE family protein</td>
</tr>
<tr>
<td valign="top" align="left">Effector delivery system</td>
<td valign="top" align="left"><italic>esxG</italic></td>
<td valign="top" align="left">Type VII secretion system protein EsxG</td>
</tr>
<tr>
<td valign="top" align="left">Effector delivery system</td>
<td valign="top" align="left"><italic>esxH</italic></td>
<td valign="top" align="left">Type VII secretion system protein ESXH (10 kDa antigen) (CFP-7) (protein TB10.4)</td>
</tr>
<tr>
<td valign="top" align="left">Others</td>
<td valign="top" align="left"><italic>icl</italic></td>
<td valign="top" align="left">Isocitrate lyase Icl (isocitrase) (isocitratase)</td>
</tr>
<tr>
<td valign="top" align="left">Adherence</td>
<td valign="top" align="left"><italic>hbhA</italic></td>
<td valign="top" align="left">iron-regulated heparin binding hemagglutinin hbhA (adhesin)</td>
</tr>
<tr>
<td valign="top" align="left">Regulation</td>
<td valign="top" align="left"><italic>ideR</italic></td>
<td valign="top" align="left">Iron-dependent repressor and activator IdeR</td>
</tr>
<tr>
<td valign="top" align="left">Regulation</td>
<td valign="top" align="left"><italic>relA</italic></td>
<td valign="top" align="left">Probable GTP pyrophosphokinase RelA (ATP: GTP 3&#x2019;-pyrophosphotransferase) (PPGPP synthetase I) ((P)PPGPP synthetase) (GTP diphosphokinase)</td>
</tr>
<tr>
<td valign="top" align="left">Effector delivery system</td>
<td valign="top" align="left"><italic>esxM</italic></td>
<td valign="top" align="left">type VII secretion system ESX-5 protein EsxJ</td>
</tr>
<tr>
<td valign="top" align="left">Effector delivery system</td>
<td valign="top" align="left"><italic>esxN</italic></td>
<td valign="top" align="left">ESX-5 type VII secretion system EsxA (ESAT-6) homolog</td>
</tr>
<tr>
<td valign="top" align="left">Effector delivery system</td>
<td valign="top" align="left"><italic>Rv1794</italic></td>
<td valign="top" align="left">ESX-5 locus protein</td>
</tr>
<tr>
<td valign="top" align="left">Effector delivery system</td>
<td valign="top" align="left"><italic>eccD5</italic></td>
<td valign="top" align="left">ESX-5 type VII secretion system EccD5</td>
</tr>
<tr>
<td valign="top" align="left">Effector delivery system</td>
<td valign="top" align="left"><italic>mycP5</italic></td>
<td valign="top" align="left">ESX-5 type VII secretion system subtilisin-like serine protease MycP5</td>
</tr>
<tr>
<td valign="top" align="left">Effector delivery system</td>
<td valign="top" align="left"><italic>eccA5</italic></td>
<td valign="top" align="left">ESX-5 type VII secretion system AAA + ATPase EccA5</td>
</tr>
<tr>
<td valign="top" align="left">Adherence</td>
<td valign="top" align="left"><italic>fbpB</italic></td>
<td valign="top" align="left">Secreted antigen 85-B FbpB (85B) (antigen 85 complex B) (mycolyl transferase 85B) (fibronectin-binding protein B) (extracellular alpha-antigen)</td>
</tr>
<tr>
<td valign="top" align="left">Nutritional/Metabolic factor</td>
<td valign="top" align="left"><italic>mbtH</italic></td>
<td valign="top" align="left">MbtH-like protein</td>
</tr>
<tr>
<td valign="top" align="left">Regulation</td>
<td valign="top" align="left"><italic>phoP</italic></td>
<td valign="top" align="left">Possible two component system response transcriptional positive regulator PhoP</td>
</tr>
<tr>
<td valign="top" align="left">Effector delivery system</td>
<td valign="top" align="left"><italic>eccA1</italic></td>
<td valign="top" align="left">ESX-1 type VII secretion system AAA + ATPase EccA1</td>
</tr>
<tr>
<td valign="top" align="left">Effector delivery system</td>
<td valign="top" align="left"><italic>eccCa1</italic></td>
<td valign="top" align="left">ESX-1 type VII secretion system FtsK/SpoIIIE family protein EccCa1</td>
</tr>
<tr>
<td valign="top" align="left">Effector delivery system</td>
<td valign="top" align="left"><italic>eccCb1</italic></td>
<td valign="top" align="left">ESX-1 type VII secretion system FtsK/SpoIIIE family protein EccCb1</td>
</tr>
<tr>
<td valign="top" align="left">Effector delivery system</td>
<td valign="top" align="left"><italic>esxA</italic></td>
<td valign="top" align="left">6 kDa early secretory antigenic target EsxA (ESAT-6)</td>
</tr>
</tbody>
</table></table-wrap>
</sec>
<sec id="S3.SS5">
<title>3.5 Genomic plasticity identification</title>
<p>The RGP analysis of the pangenome of <italic>M. marinum</italic> revealed significant genomic diversity among the different strains. A total of 34 RGPs were identified in the study, with some RGPs present in multiple strains, indicating conservation among different strains. Notably, antimicrobial resistance genes, such as those conferring resistance to dibekacin, netilmicin, tobramycin, and Fosfomycin, were widespread among the strains. Additionally, antibiotic-resistant murA transferase, aminosalicylate resistant, and virulence factor genes were found to be co-localized in the same RGP, suggesting potential co-regulation. The analysis also identified several modules (or genes) that were present in multiple strains, including modules 26, 32, 28, 30, and 44. Strain-specific RGPs were also observed, with strain CCUG20998 having a unique RGP (RGP_0) and strain MMA1 having a unique RGP (RGP_14). Overall, the RGP analysis highlights the complex genomic landscape of <italic>M. marinum</italic> and the potential for co-regulation of antimicrobial resistance and virulence genes.</p>
</sec>
<sec id="S3.SS6">
<title>3.6 Gene gain-loss evaluation</title>
<p>The analysis of the open pangenome model reveals critical insights into the temporal dynamics of gene gain and loss events. The significant negative estimate of the &#x201C;core&#x201D; term (&#x2013;0.705, <italic>p</italic> = 1.02e-4), coupled with the narrow bootstrap confidence interval (&#x2013;1.15, &#x2013;0.255), indicates strong evidence for an open pangenome (<xref ref-type="fig" rid="F6">Figure 6</xref>). This suggests that gene gain and loss events are continuously accumulating over time, characteristic of an open system where new genes are incorporated as the genome evolves. The accumulation is not temporally limited, signifying ongoing horizontal gene transfer or gene acquisition from various sources, possibly through mobile genetic elements, which are typically associated with open pangenomes. Furthermore, the non-significant estimates for &#x201C;depth&#x201D; (estimate = &#x2013;0.0195, <italic>p</italic> = 4.62e-1) and &#x201C;tip&#x201D; (estimate = &#x2013;0.153, <italic>p</italic> = 4.31e-1) align with the expected pattern for an open pangenome. These results suggest that there are no substantial differences in detecting older gene exchange events or gene presence at the tips, reinforcing the idea that gene gain and loss occur throughout the evolutionary history of the genomes, not confined to specific time points. The non-significance of the dispersion term also implies that the rate and size of gene exchange events remain consistent, rather than varying dramatically between different branches of the phylogeny. The plot comparing cumulative gene gain and loss events against core branch distance shows distinct patterns for fast and slow-evolving pangenomes. The rapid accumulation of genes in the fast-evolving pangenome supports the interpretation of an open system, where more gene exchange events occur over shorter evolutionary timescales, especially along terminal branches, as indicated by the denser clustering (<xref ref-type="fig" rid="F6">Figure 6</xref>). This continuous acquisition of genes aligns with the expected behavior of an open pangenome, where there is no saturation point for gene gain, and new genes continue to enter the genome pool over time.</p>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption><p>Cumulative gene gain and loss events versus cumulative core branch distance for fast and slow-evolving pangenomes. The scatter plot distinguishes between internal branches (circles) and terminal branches (triangles), with &#x201C;fast&#x201D; pangenomes shown in red and &#x201C;slow&#x201D; pangenomes in blue. The steeper accumulation of gene gain and loss events in fast-evolving pangenomes, particularly along terminal branches, indicates an open pangenome with ongoing gene acquisition over time. The accompanying bar plots display the model estimates for the core, tip, and phi terms, with confidence intervals for both fast and slow pangenomes. The significant temporal signal in the core term suggests continuous gene flow in the open pangenome, whereas the non-significant depth and dispersion parameters reflect consistent gene exchange across the phylogeny.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmicb-16-1537826-g006.tif"/>
</fig>
</sec>
<sec id="S3.SS7">
<title>3.7 Benchmarking annotation data</title>
<p>The benchmarking analysis presented in <xref ref-type="fig" rid="F7">Figure 7</xref> provides a comparative evaluation of EggNOG-mapper and InterProScan for annotating <italic>M. marinum</italic> genomes. <xref ref-type="fig" rid="F7">Figure 7A</xref> showing a higher proportion of true positive annotations for both tools, with EggNOG-mapper achieving 80% true positives compared to 70% for InterProScan. False positive rates are comparatively lower, indicating that both tools provide a reliable level of annotation accuracy, though EggNOG-mapper has an advantage. The average GO terms per protein, reveals that EggNOG-mapper assigns a higher average of curated (true positive) terms per protein, reflecting greater annotation specificity and comprehensiveness (<xref ref-type="fig" rid="F7">Figure 7B</xref>). InterProScan, while also providing curated terms, shows a slightly lower average, particularly in false positive and non-curated terms, which suggests a more conservative annotation approach. <xref ref-type="fig" rid="F7">Figure 7C</xref> demonstrating that both techniques offer substantial coverage exclusively with true positive (TP) annotations. EggNOG-mapper covers 60% of the proteome with TP terms only, whereas InterProScan covers 55%, indicating robust proteome-level annotation by both tools, though EggNOG-mapper marginally outperforms in exclusive TP coverage. Together, these results indicate that EggNOG-mapper provides a more extensive annotation profile across metrics, making it slightly more effective in annotation accuracy, specificity, and proteome coverage.</p>
<fig id="F7" position="float">
<label>FIGURE 7</label>
<caption><p>Benchmarking of EggNOG-mapper and InterProScan annotation tools for <italic>M. marinum</italic>. <bold>(A)</bold> GO term accuracy showing proportions of true and false positives; <bold>(B)</bold> average GO terms per protein, categorized into curated terms; <bold>(C)</bold> proteome coverage indicating the percentage of proteins annotated with only true positives, a mix of true and false positives, or no true positives.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmicb-16-1537826-g007.tif"/>
</fig>
</sec>
</sec>
<sec id="S4" sec-type="discussion">
<title>4 Discussion</title>
<p><italic>Mycobacterium marinum</italic> presents a zoonotic threat, causing granulomatous skin lesions and deeper tissue infections in humans (<xref ref-type="bibr" rid="B42">Petrini, 2006</xref>). Transmission typically occurs via contact with contaminated water (<xref ref-type="bibr" rid="B61">Tsai et al., 2007</xref>) or injuries from fish spines (<xref ref-type="bibr" rid="B28">Jernigan and Farr, 2000</xref>), presenting clinically as ulcers, nodular lymphangitis, or &#x2212; more severely &#x2212; tenosynovitis, arthritis, or osteomyelitis (<xref ref-type="bibr" rid="B67">Wongworawat et al., 2003</xref>). The disease spectrum ranges from self-limiting infections to chronic, treatment-resistant cases (<xref ref-type="bibr" rid="B3">Aubry et al., 2002</xref>), highlighting the need to characterize both conserved and emerging virulence factors and antibiotic resistance mechanisms.</p>
<p>This study provides significant insights into the genomic landscape and evolutionary dynamics of <italic>M. marinum</italic>, a pathogen capable of infecting both fish and humans. The consistently high ANI values (&#x2265; 98%) among strains from both hosts indicate a close genetic relationship, despite differences in host origin. These findings challenge previous observations by <xref ref-type="bibr" rid="B11">Das et al. (2018)</xref>, likely due to our use of complete genome sequences for comparative analysis, which offers a more precise and thorough understanding of an organism&#x2019;s genetic composition than analyses based on contigs, scaffolds, or chromosomes (<xref ref-type="bibr" rid="B65">Vasudevan et al., 2020</xref>). Our data suggest that <italic>M. marinum</italic> conserved survival and virulence mechanisms in diverse hosts, potentially making it as a generalist pathogen. The maintenance of such high genetic similarity across species further implies a strong evolutionary conservation of core biological functions, a trait shared by other pathogenic mycobacteria such as <italic>M. tuberculosis</italic> (<xref ref-type="bibr" rid="B18">Fisher, 2021</xref>). Moreover, the open nature of the <italic>M. marinum</italic> pangenome&#x2014;demonstrated by Heap&#x2019;s law and power-law fitting&#x2014;supports its high genomic plasticity. The gradual slope of the fitted curve indicates that the discovery of new genes is ongoing and will likely continue as more genomes are analyzed. This open pangenome model stands in contrasts to closed pangenomes, such as that of <italic>Bacillus anthracis</italic> (<xref ref-type="bibr" rid="B51">Selvaraj et al., 2021</xref>), where little to no new gene acquisition occurs. Additionally, the high number of strain-specific singleton genes in <italic>M. marinum</italic> further highlights its rapid genome evolution, likely driven by HGT (<xref ref-type="bibr" rid="B15">Dumas et al., 2016</xref>) and adaptation to diverse environmental stresses. These unique genes may confer strain-specific advantages, such as enhanced resistance to environmental pathogens (e.g., <italic>Pseudomonas aeruginosa</italic>), where strain-specific genes are linked to niche adaptation and virulence (<xref ref-type="bibr" rid="B30">Jurado-Mart&#x00ED;n et al., 2021</xref>).</p>
<p>This study presents the first benchmarking analysis of the <italic>M. marinum</italic> pangenome, validating the utility of pangenomic bioinformatic tools (<xref ref-type="bibr" rid="B64">van Dongen and Abreu-Goodger, 2012</xref>). The significant negative estimate of the &#x201C;core&#x201D; term (&#x2013;0.705, <italic>p</italic>-value = 1.02e-4) with a narrow bootstrap confidence interval (&#x2013;1.15 to &#x2013;0.255) confirms the presence of a robust open pangenome (<xref ref-type="bibr" rid="B57">Tokuda and Shintani, 2024</xref>). The non-significant estimates for &#x201C;depth&#x201D; (&#x2013;0.0195, <italic>p</italic>-value = 0.462) and &#x201C;istip&#x201D; (&#x2013;0.153, <italic>p</italic> = 0.431) further support the notion of continuous gene acquisition and loss throughout the pathogen&#x2019;s evolutionary history. Analysis of cumulative gene gain/loss events across core branch distances shows distinct patterns, differentiating fast- from slow-evolving pangenomes. The rapid accumulation of genes in fast-evolving pangenomes supports the interpretation of an open system, where increased gene exchange occurs over shorter evolutionary timescales. Furthermore, benchmarking annotation tools revealed that EggNOG-mapper&#x2019;s superiority in providing more comprehensive and accurate functional annotations for <italic>M. marinum</italic>, possibly attributable to its enormous annotation library and advanced prediction methods. While InterProScan remains precise, its conservative annotation approach results in fewer annotations, which may be preferred in studies prioritizing specificity.</p>
<p>Our comprehensive genomic analysis also highlighted critical virulence factors, particularly the <italic>ESX1</italic> secretion system. Similar to the findings reported in previous studies, all analyzed <italic>M. marinum</italic> strains exhibited partial duplication of the <italic>ESX1</italic> cluster, resulting in multiple copies of key virulence-associated genes, including <italic>esxA</italic> and <italic>esxB</italic> (<xref ref-type="bibr" rid="B19">Gao et al., 2004</xref>; <xref ref-type="bibr" rid="B54">Stinear et al., 2008</xref>). While <italic>esxA</italic> was conserved across all strains, truncated variants of <italic>esxB</italic> were common, indicating that <italic>esxB</italic> may be dispensable, whereas <italic>esxA</italic> appears crucial for virulence, in line with earlier reports (<xref ref-type="bibr" rid="B49">Rogall et al., 1990</xref>). Moreover, our study identified the existence of an additional <italic>ESX</italic> region &#x2212; designated <italic>ESX6</italic> &#x2212; including <italic>esxG, esxH, esxM</italic>, and <italic>esxN</italic>. The presence of these paralogs suggests compensatory mechanisms for virulence via gene conversion or epitope variation, as previously proposed (<xref ref-type="bibr" rid="B14">Derbyshire and Gray, 2014</xref>; <xref ref-type="bibr" rid="B63">Uplekar et al., 2011</xref>). This study is the first to report the presence of virulence-associated genes (e.g., <italic>mycP5, relA, fbpB, mbtH, phoP</italic>, and <italic>fbpC</italic>) in <italic>M. marinum</italic>. These genes are involved in effector delivery, stress response, nutrient acquisition, and host adherence, and likely contribute significantly to the pathogenic potential of <italic>M. marinum</italic>. The identification of gene duplications and the presence of paralogs suggest a complex evolutionary strategy aimed at maximizing adaptability and virulence. These insights not only reinforce previous studies but also contribute novel data regarding the virulence strategies employed by <italic>M. marinum</italic>, emphasizing the importance of <italic>ESX</italic> gene clusters in mycobacterial pathogenesis. While the current study sheds light on the potential of SNPs as genetic markers for pathogenicity and antibiotic resistance, future investigation should utilize high-fidelity sequencing platforms and orthogonal techniques. This is especially crucial given the variability in whole genome sequencing quality (e.g., depth, coverage, and error rates) associated with various technologies that may affect the accuracy of SNPs detection.</p>
<p>The analysis of RGP revealed extensive genomic diversity, identifying 34 RGPs, with some conserved across multiple strains. This marks the first detailed characterization of RGPs in <italic>M. marinum</italic> and highlights their role in environmental adaptation. Notably, antimicrobial resistance genes (e.g., dibekacin, netilmicin, tobramycin, and fosfomycin) were found co-localized with virulence genes such as <italic>esxB and esxA</italic>, suggesting possible co-regulation driven by HGT. Strain-specific RGPs, particularly in CCUG20998 and MMA1, reflect the pathogen&#x2019;s capacity for genomic adaptability of <italic>M. marinum</italic>. The co-localization of resistance and virulence determinants presents promising targets for therapeutic strategies (<xref ref-type="bibr" rid="B5">Beceiro et al., 2013</xref>; <xref ref-type="bibr" rid="B34">Lazar et al., 2023</xref>) and enhances our understanding of <italic>M. marinum</italic>&#x2019;s resilience in various environments.</p>
<p>In conclusion, this study demonstrates significant genomic and evolutionary insights with potential applications in diagnostic and aquaculture biosecurity. The identification of strain-specific SNPs in conserved genes provides a basis for developing rapid molecular diagnostics, including targeted PCR assays or CRISPR-based assays (<xref ref-type="bibr" rid="B35">Li et al., 2024</xref>). Similarly, conserved virulence genes could serve as biomarkers for multiplex qPCR aimed at detecting pathogenic strains in aquaculture systems (<xref ref-type="bibr" rid="B10">Chirakos et al., 2020</xref>; <xref ref-type="bibr" rid="B21">Gcebe et al., 2018</xref>). Furthermore, the co-occurrence of antibiotic resistance and virulence genes within RGPs highlights the urgent need for integrated surveillance strategies in both clinical and aquaculture settings. Future validation of these markers under field conditions will be critical to translating these findings into practical applications.</p>
</sec>
<sec id="S5" sec-type="conclusion">
<title>5 Conclusion</title>
<p>This study offers valuable genomic insights into <italic>Mycobacterium marinum</italic>, shedding light on its adaptability, virulence mechanisms, and potential as a generalist zoonotic pathogen. The high ANI values across strains, the open pangenome structure, and the abundance of singleton genes indicate ongoing evolution driven by gene acquisition and host adaptation. The identification of critical virulence factors, such as <italic>ESX</italic>1, <italic>ESX6</italic>, and novel genes like <italic>mycP5, relA</italic>, and <italic>fbpC</italic>, along with co-localized resistance genes in regions of RGPs, underscores the pathogen&#x2019;s genomic plasticity. These findings contribute to our understanding of <italic>M. marinum</italic> pathogenesis and play an important role for improved diagnostics, surveillance, and therapeutic strategies.</p>
</sec>
</body>
<back>
<sec id="S6" sec-type="data-availability">
<title>Data availability statement</title>
<p>The datasets analyzed during the current study are available in the National Center for Biotechnology Information (NCBI) (<ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov">https://www.ncbi.nlm.nih.gov</ext-link>). Details of the data retrieved from the NCBI database are included in <xref ref-type="supplementary-material" rid="TS1">Supplementary Table 1</xref>.</p>
</sec>
<sec id="S7" sec-type="author-contributions">
<title>Author contributions</title>
<p>KS: Data curation, Formal Analysis, Software, Writing &#x2013; original draft. SI: Conceptualization, Data curation, Funding acquisition, Methodology, Project administration, Supervision, Validation, Writing &#x2013; original draft, Writing &#x2013; review and editing. PS: Formal Analysis, Writing &#x2013; review and editing, Validation, Supervision. W-KJ: Methodology, Supervision, Validation, Writing &#x2013; review and editing. PP: Formal Analysis, Funding acquisition, Writing &#x2013; review and editing. NVL: Conceptualization, Formal Analysis, Data curation, Funding acquisition, Writing &#x2013; review and editing, Supervision, Validation.</p>
</sec>
<sec id="S8" sec-type="funding-information">
<title>Funding</title>
<p>The author(s) declare that financial support was received for the research and/or publication of this article. This work was funded by Bigbang International Project (No. #46349), Chiang Mai University.</p>
</sec>
<ack><p>We are thankful to BioMac Lab, Dhaka, Bangladesh for providing the technical support.</p>
</ack>
<sec id="S9" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="S10" sec-type="ai-statement">
<title>Generative AI statement</title>
<p>The authors declare that no Generative AI was used in the creation of this manuscript.</p>
</sec>
<sec id="S11" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="S12" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fmicb.2025.1537826/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fmicb.2025.1537826/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Supplementary_file_1.docx" id="FS1" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Supplementary_file_2.docx" id="TS1" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<fn-group>
<fn id="footnote1">
<label>1</label>
<p><ext-link ext-link-type="uri" xlink:href="https://github.com/SethCommichaux/Heap_Law_for_Roary">https://github.com/SethCommichaux/Heap_Law_for_Roary</ext-link></p></fn>
<fn id="footnote2">
<label>2</label>
<p><ext-link ext-link-type="uri" xlink:href="https://github.com/pinbo/msa2snp">https://github.com/pinbo/msa2snp</ext-link></p></fn>
<fn id="footnote3">
<label>3</label>
<p><ext-link ext-link-type="uri" xlink:href="https://github.com/tseemann/abricate">https://github.com/tseemann/abricate</ext-link></p></fn>
<fn id="footnote4">
<label>4</label>
<p><ext-link ext-link-type="uri" xlink:href="https://github.com/labgem/PPanGGOLiN">https://github.com/labgem/PPanGGOLiN</ext-link></p></fn>
<fn id="footnote5">
<label>5</label>
<p><ext-link ext-link-type="uri" xlink:href="https://github.com/gtonkinhill/panstripe">https://github.com/gtonkinhill/panstripe</ext-link></p></fn>
</fn-group>
<ref-list>
<title>References</title>
<ref id="B1"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Abdella</surname> <given-names>B.</given-names></name> <name><surname>Abozahra</surname> <given-names>N.</given-names></name> <name><surname>Shokrak</surname> <given-names>N.</given-names></name> <name><surname>Mohamed</surname> <given-names>R.</given-names></name> <name><surname>El-Helow</surname> <given-names>E.</given-names></name></person-group> (<year>2023</year>). <article-title>Whole spectrum of Aeromonas hydrophila virulence determinants and the identification of novel SNPs using comparative pathogenomics.</article-title> <source><italic>Sci. Rep.</italic></source> <volume>13</volume>:<fpage>7712</fpage>. <pub-id pub-id-type="doi">10.1038/s41598-023-34887-1</pub-id> <pub-id pub-id-type="pmid">37173388</pub-id></citation></ref>
<ref id="B2"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Aronson</surname> <given-names>J. D.</given-names></name></person-group> (<year>1926</year>). <article-title>Spontaneous tuberculosis in salt water fish.</article-title> <source><italic>J. Infect. Dis.</italic></source> <volume>39</volume> <fpage>315</fpage>&#x2013;<lpage>320</lpage>. <pub-id pub-id-type="doi">10.1093/infdis/39.4.315</pub-id></citation></ref>
<ref id="B3"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Aubry</surname> <given-names>A.</given-names></name> <name><surname>Chosidow</surname> <given-names>O.</given-names></name> <name><surname>Caumes</surname> <given-names>E.</given-names></name> <name><surname>Robert</surname> <given-names>J.</given-names></name> <name><surname>Cambau</surname> <given-names>E.</given-names></name></person-group> (<year>2002</year>). <article-title>Sixty-three cases of Mycobacterium marinum infection: Clinical features, treatment, and antibiotic susceptibility of causative isolates.</article-title> <source><italic>Arch. Intern. Med.</italic></source> <volume>162</volume> <fpage>1746</fpage>&#x2013;<lpage>1752</lpage>. <pub-id pub-id-type="doi">10.1001/archinte.162.15.1746</pub-id> <pub-id pub-id-type="pmid">12153378</pub-id></citation></ref>
<ref id="B4"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Aubry</surname> <given-names>A.</given-names></name> <name><surname>Mougari</surname> <given-names>F.</given-names></name> <name><surname>Reibel</surname> <given-names>F.</given-names></name> <name><surname>Cambau</surname> <given-names>E.</given-names></name></person-group> (<year>2017</year>). &#x201C;<article-title>Mycobacterium marinum</article-title>&#x201D;, in <source><italic>Tuberculosis and Nontuberculous Mycobacterial Infections</italic></source>, <role>ed.</role> D. Schlossberg, <pub-id pub-id-type="doi">10.1128/9781555819866.ch43</pub-id></citation></ref>
<ref id="B5"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Beceiro</surname> <given-names>A.</given-names></name> <name><surname>Tom&#x00E1;s</surname> <given-names>M.</given-names></name> <name><surname>Bou</surname> <given-names>G.</given-names></name></person-group> (<year>2013</year>). <article-title>Antimicrobial resistance and virulence: A successful or deleterious association in the bacterial world?</article-title> <source><italic>Clin. Microbiol. Rev.</italic></source> <volume>26</volume> <fpage>185</fpage>&#x2013;<lpage>230</lpage>. <pub-id pub-id-type="doi">10.1128/CMR.00059-12</pub-id> <pub-id pub-id-type="pmid">23554414</pub-id></citation></ref>
<ref id="B6"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Beecham</surname> <given-names>H.</given-names></name> <name><surname>Oldfield</surname> <given-names>E.</given-names></name> <name><surname>Lewis</surname> <given-names>D.</given-names></name> <name><surname>Buker</surname> <given-names>J.</given-names></name></person-group> (<year>1991</year>). <article-title>Mycobacterium marinum infection from shucking oysters.</article-title> <source><italic>Lancet</italic></source> <volume>337</volume>:<fpage>1487</fpage>. <pub-id pub-id-type="doi">10.1016/0140-6736(91)93183-a</pub-id> <pub-id pub-id-type="pmid">1675357</pub-id></citation></ref>
<ref id="B7"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Camacho</surname> <given-names>C.</given-names></name> <name><surname>Coulouris</surname> <given-names>G.</given-names></name> <name><surname>Avagyan</surname> <given-names>V.</given-names></name> <name><surname>Ma</surname> <given-names>N.</given-names></name> <name><surname>Papadopoulos</surname> <given-names>J.</given-names></name> <name><surname>Bealer</surname> <given-names>K.</given-names></name><etal/></person-group> (<year>2009</year>). <article-title>BLAST+: Architecture and applications.</article-title> <source><italic>BMC Bioinformatics</italic></source> <volume>10</volume>:<fpage>421</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2105-10-421</pub-id> <pub-id pub-id-type="pmid">20003500</pub-id></citation></ref>
<ref id="B8"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cantalapiedra</surname> <given-names>C.</given-names></name> <name><surname>Hern&#x00E1;ndez-Plaza</surname> <given-names>A.</given-names></name> <name><surname>Letunic</surname> <given-names>I.</given-names></name> <name><surname>Bork</surname> <given-names>P.</given-names></name> <name><surname>Huerta-Cepas</surname> <given-names>J.</given-names></name></person-group> (<year>2021</year>). <article-title>eggNOG-mapper v2: Functional annotation, orthology assignments, and domain prediction at the metagenomic scale.</article-title> <source><italic>Mol. Biol. Evol.</italic></source> <volume>38</volume> <fpage>5825</fpage>&#x2013;<lpage>5829</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/msab293</pub-id> <pub-id pub-id-type="pmid">34597405</pub-id></citation></ref>
<ref id="B9"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cardenal-Mu&#x00F1;oz</surname> <given-names>E.</given-names></name> <name><surname>Barisch</surname> <given-names>C.</given-names></name> <name><surname>Lefran&#x00E7;ois</surname> <given-names>L.</given-names></name> <name><surname>L&#x00F3;pez-Jim&#x00E9;nez</surname> <given-names>A.</given-names></name> <name><surname>Soldati</surname> <given-names>T.</given-names></name></person-group> (<year>2018</year>). <article-title>When dicty met myco, a (not so) romantic story about one amoeba and its intracellular pathogen.</article-title> <source><italic>Front. Cell. Infect. Microbiol.</italic></source> <volume>7</volume>:<fpage>529</fpage>. <pub-id pub-id-type="doi">10.3389/fcimb.2017.00529</pub-id> <pub-id pub-id-type="pmid">29376033</pub-id></citation></ref>
<ref id="B10"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chirakos</surname> <given-names>A.</given-names></name> <name><surname>Balaram</surname> <given-names>A.</given-names></name> <name><surname>Conrad</surname> <given-names>W.</given-names></name> <name><surname>Champion</surname> <given-names>P.</given-names></name></person-group> (<year>2020</year>). <article-title>Modeling tubercular ESX-1 secretion using Mycobacterium marinum.</article-title> <source><italic>Microbiol. Mol. Biol. Rev.</italic></source> <volume>84</volume>:<fpage>e00082-19</fpage>. <pub-id pub-id-type="doi">10.1128/MMBR.00082-19</pub-id> <pub-id pub-id-type="pmid">32878966</pub-id></citation></ref>
<ref id="B11"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Das</surname> <given-names>S.</given-names></name> <name><surname>Pettersson</surname> <given-names>B.</given-names></name> <name><surname>Behra</surname> <given-names>P.</given-names></name> <name><surname>Mallick</surname> <given-names>A.</given-names></name> <name><surname>Cheramie</surname> <given-names>M.</given-names></name> <name><surname>Ramesh</surname> <given-names>M.</given-names></name><etal/></person-group> (<year>2018</year>). <article-title>Extensive genomic diversity among Mycobacterium marinum strains revealed by whole genome sequencing.</article-title> <source><italic>Sci. Rep.</italic></source> <volume>8</volume>:<fpage>12040</fpage>. <pub-id pub-id-type="doi">10.1038/s41598-018-30152-y</pub-id> <pub-id pub-id-type="pmid">30104693</pub-id></citation></ref>
<ref id="B12"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dauendorffer</surname> <given-names>J.</given-names></name> <name><surname>Guillemin</surname> <given-names>I.</given-names></name> <name><surname>Aubry</surname> <given-names>A.</given-names></name> <name><surname>Truffot-Pernot</surname> <given-names>C.</given-names></name> <name><surname>Sougakoff</surname> <given-names>W.</given-names></name> <name><surname>Jarlier</surname> <given-names>V.</given-names></name><etal/></person-group> (<year>2003</year>). <article-title>Identification of mycobacterial species by PCR sequencing of quinolone resistance-determining regions of DNA gyrase genes.</article-title> <source><italic>J. Clin. Microbiol.</italic></source> <volume>41</volume> <fpage>1311</fpage>&#x2013;<lpage>1315</lpage>. <pub-id pub-id-type="doi">10.1128/JCM.41.3.1311-1315.2003</pub-id> <pub-id pub-id-type="pmid">12624075</pub-id></citation></ref>
<ref id="B13"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>de Man</surname> <given-names>T.</given-names></name> <name><surname>Limbago</surname> <given-names>B. M.</given-names></name></person-group> (<year>2016</year>). <article-title>SSTAR, a stand-alone easy-to-use antimicrobial resistance gene predictor.</article-title> <source><italic>mSphere</italic></source> <volume>1</volume>:<fpage>e00050-15</fpage>. <pub-id pub-id-type="doi">10.1128/mSphere.00050-15</pub-id> <pub-id pub-id-type="pmid">27303709</pub-id></citation></ref>
<ref id="B14"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Derbyshire</surname> <given-names>K.</given-names></name> <name><surname>Gray</surname> <given-names>T.</given-names></name></person-group> (<year>2014</year>). <article-title>Distributive conjugal transfer: New insights into horizontal gene transfer and genetic exchange in mycobacteria.</article-title> <source><italic>Microbiol. Spectr.</italic></source> <volume>2</volume>:<fpage>4</fpage>. <pub-id pub-id-type="doi">10.1128/microbiolspec.MGM2-0022-2013</pub-id></citation></ref>
<ref id="B15"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dumas</surname> <given-names>E.</given-names></name> <name><surname>Christina Boritsch</surname> <given-names>E.</given-names></name> <name><surname>Vandenbogaert</surname> <given-names>M.</given-names></name> <name><surname>Rodr&#x00ED;guez de la Vega</surname> <given-names>R. C.</given-names></name> <name><surname>Thiberge</surname> <given-names>J. M.</given-names></name> <name><surname>Caro</surname> <given-names>V.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>Mycobacterial pan-genome analysis suggests important role of plasmids in the radiation of type VII secretion systems.</article-title> <source><italic>Genome Biol. Evol.</italic></source> <volume>8</volume> <fpage>387</fpage>&#x2013;<lpage>402</lpage>. <pub-id pub-id-type="doi">10.1093/gbe/evw001</pub-id> <pub-id pub-id-type="pmid">26748339</pub-id></citation></ref>
<ref id="B16"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Edwards</surname> <given-names>D.</given-names></name> <name><surname>Holt</surname> <given-names>K.</given-names></name></person-group> (<year>2013</year>). <article-title>Beginner&#x2019;s guide to comparative bacterial genome analysis using next-generation sequence data.</article-title> <source><italic>Microb. Inform. Exp.</italic></source> <volume>3</volume>:<fpage>2</fpage>. <pub-id pub-id-type="doi">10.1186/2042-5783-3-2</pub-id> <pub-id pub-id-type="pmid">23575213</pub-id></citation></ref>
<ref id="B17"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Eren</surname> <given-names>A.</given-names></name> <name><surname>Esen</surname> <given-names>&#x00D6;C.</given-names></name> <name><surname>Quince</surname> <given-names>C.</given-names></name> <name><surname>Vineis</surname> <given-names>J. H.</given-names></name> <name><surname>Morrison</surname> <given-names>H. G.</given-names></name> <name><surname>Sogin</surname> <given-names>M. L.</given-names></name><etal/></person-group> (<year>2015</year>). <article-title>Anvi&#x2019;o: An advanced analysis and visualization platform for &#x2019;omics data.</article-title> <source><italic>PeerJ</italic></source> <volume>3</volume>:<fpage>e1319</fpage>. <pub-id pub-id-type="doi">10.7717/peerj.1319</pub-id> <pub-id pub-id-type="pmid">26500826</pub-id></citation></ref>
<ref id="B18"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Fisher</surname> <given-names>A.</given-names></name></person-group> (<year>2021</year>). <article-title>The evolutionary impact of population size, mutation rate and virulence on pathogen niche width.</article-title> <source><italic>J. Evol. Biol.</italic></source> <volume>34</volume> <fpage>1256</fpage>&#x2013;<lpage>1265</lpage>. <pub-id pub-id-type="doi">10.1111/jeb.13882</pub-id> <pub-id pub-id-type="pmid">34101932</pub-id></citation></ref>
<ref id="B19"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gao</surname> <given-names>L.</given-names></name> <name><surname>Guo</surname> <given-names>S.</given-names></name> <name><surname>McLaughlin</surname> <given-names>B.</given-names></name> <name><surname>Morisaki</surname> <given-names>H.</given-names></name> <name><surname>Engel</surname> <given-names>J.</given-names></name> <name><surname>Brown</surname> <given-names>E. J.</given-names></name></person-group> (<year>2004</year>). <article-title>A mycobacterial virulence gene cluster extending RD1 is required for cytolysis, bacterial spreading and ESAT-6 secretion.</article-title> <source><italic>Mol. Microbiol.</italic></source> <volume>53</volume> <fpage>1677</fpage>&#x2013;<lpage>1693</lpage>. <pub-id pub-id-type="doi">10.1111/j.1365-2958.2004.04261.x</pub-id> <pub-id pub-id-type="pmid">15341647</pub-id></citation></ref>
<ref id="B20"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gautreau</surname> <given-names>G.</given-names></name> <name><surname>Bazin</surname> <given-names>A.</given-names></name> <name><surname>Gachet</surname> <given-names>M.</given-names></name> <name><surname>Planel</surname> <given-names>R.</given-names></name> <name><surname>Burlot</surname> <given-names>L.</given-names></name> <name><surname>Dubois</surname> <given-names>M.</given-names></name><etal/></person-group> (<year>2020</year>). <article-title>PPanGGOLiN: Depicting microbial diversity via a partitioned pangenome graph.</article-title> <source><italic>PLoS Comput. Biol.</italic></source> <volume>16</volume>:<fpage>e1007732</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pcbi.1007732</pub-id> <pub-id pub-id-type="pmid">32191703</pub-id></citation></ref>
<ref id="B21"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gcebe</surname> <given-names>N.</given-names></name> <name><surname>Michel</surname> <given-names>A.</given-names></name> <name><surname>Hlokwe</surname> <given-names>T.</given-names></name></person-group> (<year>2018</year>). <article-title>Non-tuberculous Mycobacterium species causing mycobacteriosis in farmed aquatic animals of South Africa.</article-title> <source><italic>BMC Microbiol.</italic></source> <volume>18</volume>:<fpage>32</fpage>. <pub-id pub-id-type="doi">10.1186/s12866-018-1177-9</pub-id> <pub-id pub-id-type="pmid">29653505</pub-id></citation></ref>
<ref id="B22"><citation citation-type="journal"><collab>Gene Ontology Consortium.</collab> (<year>2015</year>). <article-title>Gene ontology consortium: Going forward.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>43</volume> <fpage>D1049</fpage>&#x2013;<lpage>D1056</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gku1179</pub-id> <pub-id pub-id-type="pmid">25428369</pub-id></citation></ref>
<ref id="B23"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Goris</surname> <given-names>J.</given-names></name> <name><surname>Konstantinidis</surname> <given-names>K.</given-names></name> <name><surname>Klappenbach</surname> <given-names>J.</given-names></name> <name><surname>Coenye</surname> <given-names>T.</given-names></name> <name><surname>Vandamme</surname> <given-names>P.</given-names></name> <name><surname>Tiedje</surname> <given-names>J. M.</given-names></name></person-group> (<year>2007</year>). <article-title>DNA-DNA hybridization values and their relationship to whole-genome sequence similarities.</article-title> <source><italic>Int. J. Syst. Evol. Microbiol.</italic></source> <volume>57</volume> <fpage>81</fpage>&#x2013;<lpage>91</lpage>. <pub-id pub-id-type="doi">10.1099/ijs.0.64483-0</pub-id> <pub-id pub-id-type="pmid">17220447</pub-id></citation></ref>
<ref id="B24"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Horsfield</surname> <given-names>S.</given-names></name> <name><surname>Tonkin-Hill</surname> <given-names>G.</given-names></name> <name><surname>Croucher</surname> <given-names>N.</given-names></name> <name><surname>Lees</surname> <given-names>J.</given-names></name></person-group> (<year>2023</year>). <article-title>Accurate and fast graph-based pangenome annotation and clustering with ggCaller.</article-title> <source><italic>Genome Res.</italic></source> <volume>33</volume> <fpage>1622</fpage>&#x2013;<lpage>1637</lpage>. <pub-id pub-id-type="doi">10.1101/gr.277733.123</pub-id> <pub-id pub-id-type="pmid">37620118</pub-id></citation></ref>
<ref id="B25"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Huerta-Cepas</surname> <given-names>J.</given-names></name> <name><surname>Forslund</surname> <given-names>K.</given-names></name> <name><surname>Coelho</surname> <given-names>L.</given-names></name> <name><surname>Szklarczyk</surname> <given-names>D.</given-names></name> <name><surname>Jensen</surname> <given-names>L.</given-names></name> <name><surname>von Mering</surname> <given-names>C.</given-names></name><etal/></person-group> (<year>2017</year>). <article-title>Fast genome-wide functional annotation through orthology assignment by eggNOG-mapper.</article-title> <source><italic>Mol. Biol. Evol.</italic></source> <volume>34</volume> <fpage>2115</fpage>&#x2013;<lpage>2122</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/msx148</pub-id> <pub-id pub-id-type="pmid">28460117</pub-id></citation></ref>
<ref id="B26"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hyatt</surname> <given-names>D.</given-names></name> <name><surname>Chen</surname> <given-names>G.</given-names></name> <name><surname>Locascio</surname> <given-names>P.</given-names></name> <name><surname>Land</surname> <given-names>M.</given-names></name> <name><surname>Larimer</surname> <given-names>F.</given-names></name> <name><surname>Hauser</surname> <given-names>L.</given-names></name></person-group> (<year>2010</year>). <article-title>Prodigal: Prokaryotic gene recognition and translation initiation site identification.</article-title> <source><italic>BMC Bioinformatics</italic></source> <volume>11</volume>:<fpage>119</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2105-11-119</pub-id> <pub-id pub-id-type="pmid">20211023</pub-id></citation></ref>
<ref id="B27"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Islam</surname> <given-names>S.</given-names></name> <name><surname>Shahed</surname> <given-names>K.</given-names></name> <name><surname>Ahamed</surname> <given-names>M.</given-names></name> <name><surname>Khang</surname> <given-names>L.</given-names></name> <name><surname>Jung</surname> <given-names>W.</given-names></name> <name><surname>Sangsawad</surname> <given-names>P.</given-names></name><etal/></person-group> (<year>2025</year>). <article-title>Pathogenomic insights into piscirickettsia salmonis with a focus on virulence factors, single-nucleotide polymorphism identification, and resistance dynamics.</article-title> <source><italic>Animals (Basel)</italic></source> <volume>15</volume>:<fpage>1176</fpage>. <pub-id pub-id-type="doi">10.3390/ani15081176</pub-id> <pub-id pub-id-type="pmid">40282010</pub-id></citation></ref>
<ref id="B28"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jernigan</surname> <given-names>J.</given-names></name> <name><surname>Farr</surname> <given-names>B.</given-names></name></person-group> (<year>2000</year>). <article-title>Incubation period and sources of exposure for cutaneous Mycobacterium marinum infection: Case report and review of the literature.</article-title> <source><italic>Clin. Infect. Dis.</italic></source> <volume>31</volume> <fpage>439</fpage>&#x2013;<lpage>443</lpage>. <pub-id pub-id-type="doi">10.1086/313972</pub-id> <pub-id pub-id-type="pmid">10987702</pub-id></citation></ref>
<ref id="B29"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jin</surname> <given-names>L.</given-names></name> <name><surname>Chen</surname> <given-names>Y.</given-names></name> <name><surname>Yang</surname> <given-names>W.</given-names></name> <name><surname>Qiao</surname> <given-names>Z.</given-names></name> <name><surname>Zhang</surname> <given-names>X.</given-names></name></person-group> (<year>2020</year>). <article-title>Complete genome sequence of fish-pathogenic Aeromonas hydrophila HX-3 and a comparative analysis: Insights into virulence factors and quorum sensing.</article-title> <source><italic>Sci. Rep.</italic></source> <volume>10</volume>:<fpage>15479</fpage>. <pub-id pub-id-type="doi">10.1038/s41598-020-72484-8</pub-id> <pub-id pub-id-type="pmid">32968153</pub-id></citation></ref>
<ref id="B30"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jurado-Mart&#x00ED;n</surname> <given-names>I.</given-names></name> <name><surname>Sainz-Mej&#x00ED;as</surname> <given-names>M.</given-names></name> <name><surname>McClean</surname> <given-names>S.</given-names></name></person-group> (<year>2021</year>). <article-title>Pseudomonas aeruginosa: An audacious pathogen with an adaptable arsenal of virulence factors.</article-title> <source><italic>Int. J. Mol. Sci.</italic></source> <volume>22</volume>:<fpage>3128</fpage>. <pub-id pub-id-type="doi">10.3390/ijms22063128</pub-id> <pub-id pub-id-type="pmid">33803907</pub-id></citation></ref>
<ref id="B31"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kanehisa</surname> <given-names>M.</given-names></name> <name><surname>Furumichi</surname> <given-names>M.</given-names></name> <name><surname>Tanabe</surname> <given-names>M.</given-names></name> <name><surname>Sato</surname> <given-names>Y.</given-names></name> <name><surname>Morishima</surname> <given-names>K.</given-names></name></person-group> (<year>2017</year>). <article-title>KEGG new perspectives on genomes, pathways, diseases and drugs.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>45</volume> <fpage>D353</fpage>&#x2013;<lpage>D361</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkw1092</pub-id> <pub-id pub-id-type="pmid">27899662</pub-id></citation></ref>
<ref id="B32"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kurokawa</surname> <given-names>S.</given-names></name> <name><surname>Kabayama</surname> <given-names>J.</given-names></name> <name><surname>Hwang</surname> <given-names>S.</given-names></name> <name><surname>Nho</surname> <given-names>S.</given-names></name> <name><surname>Hikima</surname> <given-names>J.</given-names></name> <name><surname>Jung</surname> <given-names>T.</given-names></name><etal/></person-group> (<year>2013</year>). <article-title>Comparative genome analysis of fish and human isolates of Mycobacterium marinum.</article-title> <source><italic>Mar. Biotechnol.</italic></source> <volume>15</volume> <fpage>596</fpage>&#x2013;<lpage>605</lpage>. <pub-id pub-id-type="doi">10.1007/s10126-013-9511-6</pub-id> <pub-id pub-id-type="pmid">23728847</pub-id></citation></ref>
<ref id="B33"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kurtz</surname> <given-names>S.</given-names></name> <name><surname>Phillippy</surname> <given-names>A.</given-names></name> <name><surname>Delcher</surname> <given-names>A.</given-names></name> <name><surname>Smoot</surname> <given-names>M.</given-names></name> <name><surname>Shumway</surname> <given-names>M.</given-names></name> <name><surname>Antonescu</surname> <given-names>C.</given-names></name><etal/></person-group> (<year>2004</year>). <article-title>Versatile and open software for comparing large genomes.</article-title> <source><italic>Genome Biol.</italic></source> <volume>5</volume>:<fpage>R12</fpage>. <pub-id pub-id-type="doi">10.1186/gb-2004-5-2-r12</pub-id> <pub-id pub-id-type="pmid">14759262</pub-id></citation></ref>
<ref id="B34"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lazar</surname> <given-names>V.</given-names></name> <name><surname>Oprea</surname> <given-names>E.</given-names></name> <name><surname>Ditu</surname> <given-names>L.</given-names></name></person-group> (<year>2023</year>). <article-title>Resistance, tolerance, virulence and bacterial pathogen fitness-current state and envisioned solutions for the near future.</article-title> <source><italic>Pathogens</italic></source> <volume>12</volume>:<fpage>746</fpage>. <pub-id pub-id-type="doi">10.3390/pathogens12050746</pub-id> <pub-id pub-id-type="pmid">37242416</pub-id></citation></ref>
<ref id="B35"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>Y.</given-names></name> <name><surname>Feng</surname> <given-names>Y.</given-names></name> <name><surname>Li</surname> <given-names>D.</given-names></name> <name><surname>Shi</surname> <given-names>D.</given-names></name> <name><surname>Chen</surname> <given-names>G. A.</given-names></name></person-group> (<year>2024</year>). <article-title>Rapid PCR-based diagnostic method for skin infection with Mycobacterium marinum.</article-title> <source><italic>Infect. Drug Resist.</italic></source> <volume>17</volume> <fpage>2833</fpage>&#x2013;<lpage>2851</lpage>. <pub-id pub-id-type="doi">10.2147/IDR.S463798</pub-id> <pub-id pub-id-type="pmid">39005849</pub-id></citation></ref>
<ref id="B36"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Liu</surname> <given-names>B.</given-names></name> <name><surname>Zheng</surname> <given-names>D.</given-names></name> <name><surname>Zhou</surname> <given-names>S.</given-names></name> <name><surname>Chen</surname> <given-names>L.</given-names></name> <name><surname>Yang</surname> <given-names>J.</given-names></name></person-group> (<year>2022</year>). <article-title>VFDB 2022: A general classification scheme for bacterial virulence factors.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>50</volume> <fpage>D912</fpage>&#x2013;<lpage>D917</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkab1107</pub-id> <pub-id pub-id-type="pmid">34850947</pub-id></citation></ref>
<ref id="B37"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mahmoud</surname> <given-names>N. H.</given-names></name> <name><surname>Elsherbiny</surname> <given-names>B. A.</given-names></name> <name><surname>Moffit</surname> <given-names>S. M.</given-names></name> <name><surname>Mohamed</surname> <given-names>J. H.</given-names></name> <name><surname>Abouelkheir</surname> <given-names>S. S.</given-names></name> <name><surname>Abdella</surname> <given-names>B.</given-names></name></person-group> (<year>2022</year>). &#x201C;<article-title>Cell biology and microbial interactions in algal cells</article-title>,&#x201D; in <source><italic>Handbook of research on algae as a sustainable solution for food, energy, and the environment</italic></source>, <publisher-loc>Pennsylvania</publisher-loc>: <publisher-name>IGI Global</publisher-name>. <fpage>84</fpage>&#x2013;<lpage>108</lpage>. <pub-id pub-id-type="doi">10.4018/978-1-6684-2438-4.ch004</pub-id></citation></ref>
<ref id="B38"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mwamburi</surname> <given-names>S.</given-names></name> <name><surname>Islam</surname> <given-names>S.</given-names></name> <name><surname>Dinh-Hung</surname> <given-names>N.</given-names></name> <name><surname>Dangsawat</surname> <given-names>O.</given-names></name> <name><surname>Sowanpreecha</surname> <given-names>R.</given-names></name> <name><surname>Khang</surname> <given-names>L.</given-names></name><etal/></person-group> (<year>2024</year>). <article-title>Genomic characterization of Bacillus sp. THPS1: A hot spring-derived species with functional features and biotechnological potential.</article-title> <source><italic>Microorganisms</italic></source> <volume>12</volume>:<fpage>2476</fpage>. <pub-id pub-id-type="doi">10.3390/microorganisms12122476</pub-id> <pub-id pub-id-type="pmid">39770679</pub-id></citation></ref>
<ref id="B39"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Page</surname> <given-names>A.</given-names></name> <name><surname>Cummins</surname> <given-names>C.</given-names></name> <name><surname>Hunt</surname> <given-names>M.</given-names></name> <name><surname>Wong</surname> <given-names>V.</given-names></name> <name><surname>Reuter</surname> <given-names>S.</given-names></name> <name><surname>Holden</surname> <given-names>M.</given-names></name><etal/></person-group> (<year>2015</year>). <article-title>Roary: Rapid large-scale prokaryote pan genome analysis.</article-title> <source><italic>Bioinformatics</italic></source> <volume>31</volume> <fpage>3691</fpage>&#x2013;<lpage>3693</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btv421</pub-id> <pub-id pub-id-type="pmid">26198102</pub-id></citation></ref>
<ref id="B40"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Parks</surname> <given-names>D.</given-names></name> <name><surname>Imelfort</surname> <given-names>M.</given-names></name> <name><surname>Skennerton</surname> <given-names>C.</given-names></name> <name><surname>Hugenholtz</surname> <given-names>P.</given-names></name> <name><surname>Tyson</surname> <given-names>G.</given-names></name></person-group> (<year>2022</year>). <article-title>CheckM: Assessing the quality of microbial genomes recovered from isolates, single cells, and metagenomes.</article-title> <source><italic>Genome Res.</italic></source> <volume>25</volume> <fpage>1043</fpage>&#x2013;<lpage>1055</lpage>. <pub-id pub-id-type="doi">10.1101/gr.186072.114</pub-id> <pub-id pub-id-type="pmid">25977477</pub-id></citation></ref>
<ref id="B41"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>P&#x00E9;rez-Pascual</surname> <given-names>D.</given-names></name> <name><surname>Lunazzi</surname> <given-names>A.</given-names></name> <name><surname>Magdelenat</surname> <given-names>G.</given-names></name> <name><surname>Rouy</surname> <given-names>Z.</given-names></name> <name><surname>Roulet</surname> <given-names>A.</given-names></name> <name><surname>Lopez-Roques</surname> <given-names>C.</given-names></name><etal/></person-group> (<year>2017</year>). <article-title>The complete genome sequence of the fish pathogen tenacibaculum maritimum provides insights into virulence mechanisms.</article-title> <source><italic>Microbiol.</italic></source> <volume>8</volume>:<fpage>1542</fpage>. <pub-id pub-id-type="doi">10.3389/fmicb.2017.01542</pub-id> <pub-id pub-id-type="pmid">28861057</pub-id></citation></ref>
<ref id="B42"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Petrini</surname> <given-names>B.</given-names></name></person-group> (<year>2006</year>). <article-title>Mycobacterium marinum: Ubiquitous agent of waterborne granulomatous skin infections.</article-title> <source><italic>Eur. J. Clin. Microbiol. Infect. Dis.</italic></source> <volume>25</volume> <fpage>609</fpage>&#x2013;<lpage>613</lpage>. <pub-id pub-id-type="doi">10.1007/s10096-006-0201-4</pub-id> <pub-id pub-id-type="pmid">17047903</pub-id></citation></ref>
<ref id="B43"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Podrzaj</surname> <given-names>L.</given-names></name> <name><surname>Burtscher</surname> <given-names>J.</given-names></name> <name><surname>Domig</surname> <given-names>K.</given-names></name></person-group> (<year>2022</year>). <article-title>Comparative genomics provides insights into genetic diversity of Clostridium tyrobutyricum and potential implications for late blowing defects in cheese.</article-title> <source><italic>Front. Microbiol.</italic></source> <volume>13</volume>:<fpage>889551</fpage>. <pub-id pub-id-type="doi">10.3389/fmicb.2022.889551</pub-id> <pub-id pub-id-type="pmid">35722315</pub-id></citation></ref>
<ref id="B44"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Quevillon</surname> <given-names>E.</given-names></name> <name><surname>Silventoinen</surname> <given-names>V.</given-names></name> <name><surname>Pillai</surname> <given-names>S.</given-names></name> <name><surname>Harte</surname> <given-names>N.</given-names></name> <name><surname>Mulder</surname> <given-names>N.</given-names></name> <name><surname>Apweiler</surname> <given-names>R.</given-names></name><etal/></person-group> (<year>2005</year>). <article-title>InterProScan: Protein domains identifier.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>33</volume> <fpage>W116</fpage>&#x2013;<lpage>W120</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gki442</pub-id> <pub-id pub-id-type="pmid">15980438</pub-id></citation></ref>
<ref id="B45"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rajput</surname> <given-names>A.</given-names></name> <name><surname>Chauhan</surname> <given-names>S.</given-names></name> <name><surname>Mohite</surname> <given-names>O.</given-names></name> <name><surname>Hyun</surname> <given-names>J.</given-names></name> <name><surname>Ardalani</surname> <given-names>O.</given-names></name> <name><surname>Jahn</surname> <given-names>L.</given-names></name><etal/></person-group> (<year>2023</year>). <article-title>Pangenome analysis reveals the genetic basis for taxonomic classification of the Lactobacillaceae family.</article-title> <source><italic>Food Microbiol.</italic></source> <volume>115</volume>:<fpage>104334</fpage>. <pub-id pub-id-type="doi">10.1016/j.fm.2023.104334</pub-id> <pub-id pub-id-type="pmid">37567624</pub-id></citation></ref>
<ref id="B46"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ramakrishnan</surname> <given-names>L.</given-names></name> <name><surname>Falkow</surname> <given-names>S.</given-names></name></person-group> (<year>1994</year>). <article-title>Mycobacterium marinum persists in cultured mammalian cells in a temperature-restricted fashion.</article-title> <source><italic>Infect. Immun.</italic></source> <volume>62</volume> <fpage>3222</fpage>&#x2013;<lpage>3229</lpage>. <pub-id pub-id-type="doi">10.1128/iai.62.8.3222-3229.1994</pub-id> <pub-id pub-id-type="pmid">8039892</pub-id></citation></ref>
<ref id="B47"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Reis</surname> <given-names>A.</given-names></name> <name><surname>Cunha</surname> <given-names>M.</given-names></name></person-group> (<year>2021</year>). <article-title>The open pan-genome architecture and virulence landscape of Mycobacterium bovis.</article-title> <source><italic>Genom</italic></source> <volume>7</volume>:<fpage>000664</fpage>. <pub-id pub-id-type="doi">10.1099/mgen.0.000664</pub-id> <pub-id pub-id-type="pmid">34714230</pub-id></citation></ref>
<ref id="B48"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Richter</surname> <given-names>M.</given-names></name> <name><surname>Rossell&#x00F3;-M&#x00F3;ra</surname> <given-names>R.</given-names></name></person-group> (<year>2009</year>). <article-title>Shifting the genomic gold standard for the prokaryotic species definition.</article-title> <source><italic>Proc. Natl. Acad. Sci. U S A.</italic></source> <volume>106</volume> <fpage>19126</fpage>&#x2013;<lpage>19131</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.0906412106</pub-id> <pub-id pub-id-type="pmid">19855009</pub-id></citation></ref>
<ref id="B49"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rogall</surname> <given-names>T.</given-names></name> <name><surname>Wolters</surname> <given-names>J.</given-names></name> <name><surname>Flohr</surname> <given-names>T.</given-names></name> <name><surname>B&#x00F6;ttger</surname> <given-names>E.</given-names></name></person-group> (<year>1990</year>). <article-title>Towards a phylogeny and definition of species at the molecular level within the genus Mycobacterium.</article-title> <source><italic>Int. J. Syst. Bacteriol.</italic></source> <volume>40</volume> <fpage>323</fpage>&#x2013;<lpage>330</lpage>. <pub-id pub-id-type="doi">10.1099/00207713-40-4-323</pub-id> <pub-id pub-id-type="pmid">2275850</pub-id></citation></ref>
<ref id="B50"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ruley</surname> <given-names>K.</given-names></name> <name><surname>Ansede</surname> <given-names>J.</given-names></name> <name><surname>Pritchett</surname> <given-names>C.</given-names></name> <name><surname>Talaat</surname> <given-names>A.</given-names></name> <name><surname>Reimschuessel</surname> <given-names>R.</given-names></name> <name><surname>Trucksis</surname> <given-names>M.</given-names></name></person-group> (<year>2004</year>). <article-title>Identification of Mycobacterium marinum virulence genes using signature-tagged mutagenesis and the goldfish model of mycobacterial pathogenesis.</article-title> <source><italic>FEMS Microbiol. Lett.</italic></source> <volume>232</volume> <fpage>75</fpage>&#x2013;<lpage>81</lpage>. <pub-id pub-id-type="doi">10.1016/S0378-1097(04)00017-5</pub-id> <pub-id pub-id-type="pmid">15019737</pub-id></citation></ref>
<ref id="B51"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Selvaraj</surname> <given-names>C.</given-names></name> <name><surname>Selvaraj</surname> <given-names>G.</given-names></name> <name><surname>Mohamed Ismail</surname> <given-names>R.</given-names></name> <name><surname>Vijayakumar</surname> <given-names>R.</given-names></name> <name><surname>Baazeem</surname> <given-names>A.</given-names></name> <name><surname>Wei</surname> <given-names>D.</given-names></name><etal/></person-group> (<year>2021</year>). <article-title>Interrogation of Bacillus anthracis SrtA active site loop forming open/close lid conformations through extensive MD simulations for understanding binding selectivity of SrtA inhibitors.</article-title> <source><italic>Saudi J. Biol. Sci.</italic></source> <volume>28</volume> <fpage>3650</fpage>&#x2013;<lpage>3659</lpage>. <pub-id pub-id-type="doi">10.1016/j.sjbs.2021.05.009</pub-id> <pub-id pub-id-type="pmid">34220215</pub-id></citation></ref>
<ref id="B52"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Soares</surname> <given-names>S.</given-names></name> <name><surname>Silva</surname> <given-names>A.</given-names></name> <name><surname>Trost</surname> <given-names>E.</given-names></name> <name><surname>Blom</surname> <given-names>J.</given-names></name> <name><surname>Ramos</surname> <given-names>R.</given-names></name> <name><surname>Carneiro</surname> <given-names>A.</given-names></name><etal/></person-group> (<year>2013</year>). <article-title>The pan-genome of the animal pathogen Corynebacterium pseudotuberculosis reveals differences in genome plasticity between the biovar ovis and equi strains.</article-title> <source><italic>PLoS One</italic></source> <volume>8</volume>:<fpage>e53818</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0053818</pub-id> <pub-id pub-id-type="pmid">23342011</pub-id></citation></ref>
<ref id="B53"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Stinear</surname> <given-names>T.</given-names></name> <name><surname>Jenkin</surname> <given-names>G.</given-names></name> <name><surname>Johnson</surname> <given-names>P.</given-names></name> <name><surname>Davies</surname> <given-names>J.</given-names></name></person-group> (<year>2000</year>). <article-title>Comparative genetic analysis of Mycobacterium ulcerans and Mycobacterium marinum reveals evidence of recent divergence.</article-title> <source><italic>J. Bacteriol.</italic></source> <volume>182</volume> <fpage>6322</fpage>&#x2013;<lpage>6330</lpage>. <pub-id pub-id-type="doi">10.1128/JB.182.22.6322-6330.2000</pub-id> <pub-id pub-id-type="pmid">11053375</pub-id></citation></ref>
<ref id="B54"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Stinear</surname> <given-names>T.</given-names></name> <name><surname>Seemann</surname> <given-names>T.</given-names></name> <name><surname>Harrison</surname> <given-names>P.</given-names></name> <name><surname>Jenkin</surname> <given-names>G.</given-names></name> <name><surname>Davies</surname> <given-names>J.</given-names></name> <name><surname>Johnson</surname> <given-names>P.</given-names></name><etal/></person-group> (<year>2008</year>). <article-title>Insights from the complete genome sequence of Mycobacterium marinum on the evolution of Mycobacterium tuberculosis.</article-title> <source><italic>Genome Res.</italic></source> <volume>18</volume> <fpage>729</fpage>&#x2013;<lpage>741</lpage>. <pub-id pub-id-type="doi">10.1101/gr.075069.107</pub-id> <pub-id pub-id-type="pmid">18403782</pub-id></citation></ref>
<ref id="B55"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tatusov</surname> <given-names>R.</given-names></name> <name><surname>Galperin</surname> <given-names>M.</given-names></name> <name><surname>Natale</surname> <given-names>D.</given-names></name> <name><surname>Koonin</surname> <given-names>E.</given-names></name></person-group> (<year>2000</year>). <article-title>The COG database: A tool for genome-scale analysis of protein functions and evolution.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>28</volume> <fpage>33</fpage>&#x2013;<lpage>36</lpage>. <pub-id pub-id-type="doi">10.1093/nar/28.1.33</pub-id> <pub-id pub-id-type="pmid">10592175</pub-id></citation></ref>
<ref id="B56"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tettelin</surname> <given-names>V.</given-names></name> <name><surname>Masignani</surname> <given-names>M. J.</given-names></name> <name><surname>Cieslewicz</surname> <given-names>C.</given-names></name> <name><surname>Donati</surname> <given-names>D.</given-names></name> <name><surname>Medini</surname> <given-names>N. L.</given-names></name> <name><surname>Ward</surname> <given-names>S. V.</given-names></name><etal/></person-group> (<year>2005</year>). &#x201C;<article-title>Genome analysis of multiple pathogenic isolates of Streptococcus agalactiae: Implications for the microbial 201c;pan-genome, 201d</article-title>,&#x201D; in <source><italic>Proceedings of the National Academy of Sciences</italic></source>, <volume>Vol. 102</volume> (<publisher-name>Springer</publisher-name>), <fpage>13950</fpage>&#x2013;<lpage>13955</lpage>.</citation></ref>
<ref id="B57"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tokuda</surname> <given-names>M.</given-names></name> <name><surname>Shintani</surname> <given-names>M.</given-names></name></person-group> (<year>2024</year>). <article-title>Microbial evolution through horizontal gene transfer by mobile genetic elements.</article-title> <source><italic>Microb .Biotechnol.</italic></source> <volume>17</volume>:<fpage>e14408</fpage>. <pub-id pub-id-type="doi">10.1111/1751-7915.14408</pub-id> <pub-id pub-id-type="pmid">38226780</pub-id></citation></ref>
<ref id="B58"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>T&#x00F8;njum</surname> <given-names>T.</given-names></name> <name><surname>Welty</surname> <given-names>D.</given-names></name> <name><surname>Jantzen</surname> <given-names>E.</given-names></name> <name><surname>Small</surname> <given-names>P.</given-names></name></person-group> (<year>1998</year>). <article-title>Differentiation of Mycobacterium ulcerans, M. marinum, and M. haemophilum: Mapping of their relationships to M. tuberculosis by fatty acid profile analysis, DNA-DNA hybridization, and 16S rRNA gene sequence analysis.</article-title> <source><italic>J. Clin. Microbiol.</italic></source> <volume>36</volume> <fpage>918</fpage>&#x2013;<lpage>925</lpage>. <pub-id pub-id-type="doi">10.1128/JCM.36.4.918-925.1998</pub-id> <pub-id pub-id-type="pmid">9542909</pub-id></citation></ref>
<ref id="B59"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tonkin-Hill</surname> <given-names>G.</given-names></name> <name><surname>Gladstone</surname> <given-names>R.</given-names></name> <name><surname>P&#x00F6;ntinen</surname> <given-names>A.</given-names></name> <name><surname>Arredondo-Alonso</surname> <given-names>S.</given-names></name> <name><surname>Bentley</surname> <given-names>S.</given-names></name> <name><surname>Corander</surname> <given-names>J.</given-names></name></person-group> (<year>2023</year>). <article-title>Robust analysis of prokaryotic pangenome gene gain and loss rates with Panstripe.</article-title> <source><italic>Genome Res.</italic></source> <volume>33</volume> <fpage>129</fpage>&#x2013;<lpage>140</lpage>. <pub-id pub-id-type="doi">10.1101/gr.277340.122</pub-id> <pub-id pub-id-type="pmid">36669850</pub-id></citation></ref>
<ref id="B60"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tonkin-Hill</surname> <given-names>G.</given-names></name> <name><surname>MacAlasdair</surname> <given-names>N.</given-names></name> <name><surname>Ruis</surname> <given-names>C.</given-names></name> <name><surname>Weimann</surname> <given-names>A.</given-names></name> <name><surname>Horesh</surname> <given-names>G.</given-names></name> <name><surname>Lees</surname> <given-names>J.</given-names></name><etal/></person-group> (<year>2020</year>). <article-title>Producing polished prokaryotic pangenomes with the Panaroo pipeline.</article-title> <source><italic>Genome Biol.</italic></source> <volume>21</volume>:<fpage>180</fpage>. <pub-id pub-id-type="doi">10.1186/s13059-020-02090-4</pub-id> <pub-id pub-id-type="pmid">32698896</pub-id></citation></ref>
<ref id="B61"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tsai</surname> <given-names>H.</given-names></name> <name><surname>Kunin</surname> <given-names>C.</given-names></name> <name><surname>Lee</surname> <given-names>S.</given-names></name> <name><surname>Chen</surname> <given-names>Y.</given-names></name> <name><surname>Wann</surname> <given-names>S.</given-names></name> <name><surname>Liu</surname> <given-names>Y.</given-names></name><etal/></person-group> (<year>2007</year>). <article-title>Fish gambler&#x2019;s tenosynovitis caused by Mycobacterium marinum: Environmental investigation of a fishing pond in Southern Taiwan.</article-title> <source><italic>Diagn. Microbiol. Infect. Dis.</italic></source> <volume>59</volume> <fpage>227</fpage>&#x2013;<lpage>230</lpage>. <pub-id pub-id-type="doi">10.1016/j.diagmicrobio.2007.04.005</pub-id> <pub-id pub-id-type="pmid">17572037</pub-id></citation></ref>
<ref id="B62"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tsiolakkis</surname> <given-names>G.</given-names></name> <name><surname>Liontos</surname> <given-names>A.</given-names></name> <name><surname>Filippas-Ntekouan</surname> <given-names>S.</given-names></name> <name><surname>Matzaras</surname> <given-names>R.</given-names></name> <name><surname>Theodorou</surname> <given-names>E.</given-names></name> <name><surname>Vardas</surname> <given-names>M.</given-names></name><etal/></person-group> (<year>2023</year>). <article-title>Mycobacterium marinum: A case-based narrative review of diagnosis and management.</article-title> <source><italic>Microorganisms</italic></source> <volume>11</volume>:<fpage>1799</fpage>. <pub-id pub-id-type="doi">10.3390/microorganisms11071799</pub-id> <pub-id pub-id-type="pmid">37512971</pub-id></citation></ref>
<ref id="B63"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Uplekar</surname> <given-names>S.</given-names></name> <name><surname>Heym</surname> <given-names>B.</given-names></name> <name><surname>Friocourt</surname> <given-names>V.</given-names></name> <name><surname>Rougemont</surname> <given-names>J.</given-names></name> <name><surname>Cole</surname> <given-names>S.</given-names></name></person-group> (<year>2011</year>). <article-title>Comparative genomics of Esx genes from clinical isolates of Mycobacterium tuberculosis provides evidence for gene conversion and epitope variation.</article-title> <source><italic>Infect .Immun.</italic></source> <volume>79</volume> <fpage>4042</fpage>&#x2013;<lpage>4049</lpage>. <pub-id pub-id-type="doi">10.1128/IAI.05344-11</pub-id> <pub-id pub-id-type="pmid">21807910</pub-id></citation></ref>
<ref id="B64"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>van Dongen</surname> <given-names>S.</given-names></name> <name><surname>Abreu-Goodger</surname> <given-names>C.</given-names></name></person-group> (<year>2012</year>). <article-title>Using MCL to extract clusters from networks.</article-title> <source><italic>Methods Mol. Biol.</italic></source> <volume>804</volume> <fpage>281</fpage>&#x2013;<lpage>295</lpage>. <pub-id pub-id-type="doi">10.1007/978-1-61779-361-5_15</pub-id> <pub-id pub-id-type="pmid">22144159</pub-id></citation></ref>
<ref id="B65"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Vasudevan</surname> <given-names>K.</given-names></name> <name><surname>Devanga Ragupathi</surname> <given-names>N.</given-names></name> <name><surname>Jacob</surname> <given-names>J.</given-names></name> <name><surname>Veeraraghavan</surname> <given-names>B.</given-names></name></person-group> (<year>2020</year>). <article-title>Highly accurate-single chromosomal complete genomes using IonTorrent and MinION sequencing of clinical pathogens.</article-title> <source><italic>Genomics</italic></source> <volume>112</volume> <fpage>545</fpage>&#x2013;<lpage>551</lpage>. <pub-id pub-id-type="doi">10.1016/j.ygeno.2019.04.006</pub-id> <pub-id pub-id-type="pmid">30978388</pub-id></citation></ref>
<ref id="B66"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wolinsky</surname> <given-names>E.</given-names></name></person-group> (<year>1992</year>). <article-title>Mycobacterial diseases other than tuberculosis.</article-title> <source><italic>Clin. Infect. Dis.</italic></source> <volume>15</volume> <fpage>1</fpage>&#x2013;<lpage>10</lpage>. <pub-id pub-id-type="doi">10.1093/clinids/15.1.1</pub-id> <pub-id pub-id-type="pmid">1617048</pub-id></citation></ref>
<ref id="B67"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wongworawat</surname> <given-names>M.</given-names></name> <name><surname>Holtom</surname> <given-names>P.</given-names></name> <name><surname>Learch</surname> <given-names>T.</given-names></name> <name><surname>Fedenko</surname> <given-names>A.</given-names></name> <name><surname>Stevanovic</surname> <given-names>M. V. A.</given-names></name></person-group> (<year>2003</year>). <article-title>prolonged case of Mycobacterium marinum flexor tenosynovitis: Radiographic and histological correlation, and review of the literature.</article-title> <source><italic>Skeletal. Radiol.</italic></source> <volume>32</volume> <fpage>542</fpage>&#x2013;<lpage>545</lpage>. <pub-id pub-id-type="doi">10.1007/s00256-003-0636-y</pub-id> <pub-id pub-id-type="pmid">12879295</pub-id></citation></ref>
<ref id="B68"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wu</surname> <given-names>H.</given-names></name> <name><surname>Wang</surname> <given-names>D.</given-names></name> <name><surname>Gao</surname> <given-names>F.</given-names></name></person-group> (<year>2021</year>). <article-title>Toward a high-quality pan-genome landscape of Bacillus subtilis by removal of confounding strains.</article-title> <source><italic>Brief. Bioinform.</italic></source> <volume>22</volume> <fpage>1951</fpage>&#x2013;<lpage>1971</lpage>. <pub-id pub-id-type="doi">10.1093/bib/bbaa013</pub-id> <pub-id pub-id-type="pmid">32065216</pub-id></citation></ref>
<ref id="B69"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wu</surname> <given-names>H.</given-names></name> <name><surname>Yang</surname> <given-names>Z.</given-names></name> <name><surname>Yang</surname> <given-names>T.</given-names></name> <name><surname>Wang</surname> <given-names>D.</given-names></name> <name><surname>Luo</surname> <given-names>H.</given-names></name> <name><surname>Gao</surname> <given-names>F.</given-names></name></person-group> (<year>2022</year>). <article-title>An effective preprocessing method for high-quality pan-genome analysis of Bacillus subtilis and. Escherichia coli.</article-title> <source><italic>Methods Mol. Biol.</italic></source> <fpage>371</fpage>&#x2013;<lpage>390</lpage>. <pub-id pub-id-type="doi">10.1007/978-1-0716-1720-5_21</pub-id> <pub-id pub-id-type="pmid">34709628</pub-id></citation></ref>
<ref id="B70"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Xu</surname> <given-names>S.</given-names></name> <name><surname>Hu</surname> <given-names>E.</given-names></name> <name><surname>Cai</surname> <given-names>Y.</given-names></name> <name><surname>Xie</surname> <given-names>Z.</given-names></name> <name><surname>Luo</surname> <given-names>X.</given-names></name> <name><surname>Zhan</surname> <given-names>L.</given-names></name><etal/></person-group> (<year>2024</year>). <article-title>Using clusterProfiler to characterize multiomics data.</article-title> <source><italic>Nat. Protoc.</italic></source> <volume>19</volume> <fpage>3292</fpage>&#x2013;<lpage>3320</lpage>. <pub-id pub-id-type="doi">10.1038/s41596-024-01020-z</pub-id> <pub-id pub-id-type="pmid">39019974</pub-id></citation></ref>
</ref-list>
</back>
</article>