<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Microbiol.</journal-id>
<journal-title>Frontiers in Microbiology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Microbiol.</abbrev-journal-title>
<issn pub-type="epub">1664-302X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fmicb.2017.00443</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Microbiology</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>A Glimpse into the World of Integrative and Mobilizable Elements in Streptococci Reveals an Unexpected Diversity and Novel Families of Mobilization Proteins</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name><surname>Coluzzi</surname> <given-names>Charles</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/266064/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Gu&#x00E9;don</surname> <given-names>G&#x00E9;rard</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/285997/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Devignes</surname> <given-names>Marie-Dominique</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Ambroset</surname> <given-names>Chlo&#x00E9;</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Loux</surname> <given-names>Valentin</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/197428/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Lacroix</surname> <given-names>Thomas</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/279292/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Payot</surname> <given-names>Sophie</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/182662/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Leblond-Bourget</surname> <given-names>Nathalie</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="author-notes" rid="fn001"><sup>&#x002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/257701/overview"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>UMR1128 DynAMic, Institut National de la Recherche Agronomique, Universit&#x00E9; de Lorraine,</institution> <country>Vand&#x0153;uvre-l&#x00E8;s-Nancy, France</country></aff>
<aff id="aff2"><sup>2</sup><institution>UMR7503 Laboratoire Lorrain de Recherche en Informatique et ses Applications, Centre National de la Recherche Scientifique, Universit&#x00E9; de Lorraine,</institution> <country>Vand&#x0153;uvre-l&#x00E8;s-Nancy, France</country></aff>
<aff id="aff3"><sup>3</sup><institution>UR1404 Math&#x00E9;matiques et Informatique Appliqu&#x00E9;es du G&#x00E9;nome &#x00E0; l&#x2019;Environnement, Institut National de la Recherche Agronomique, Universit&#x00E9; Paris-Saclay,</institution> <country>Jouy-en-Josas, France</country></aff>
<author-notes>
<fn fn-type="edited-by"><p>Edited by: <italic>Rakesh Sharma, Institute of Genomics and Integrative Biology (CSIR), India</italic></p></fn>
<fn fn-type="edited-by"><p>Reviewed by: <italic>Joshua Peter Ramsay, Curtin University, Australia; Nikolai Ravin, Institute of Bioengineering, Research Center of Biotechnology of the Russian Academy of Sciences, Russia</italic></p></fn>
<fn fn-type="corresp" id="fn001"><p>&#x002A;Correspondence: <italic>Nathalie Leblond-Bourget, <email>nathalie.leblond@univ-lorraine.fr</email></italic></p></fn>
<fn fn-type="other" id="fn002"><p>This article was submitted to Evolutionary and Genomic Microbiology, a section of the journal Frontiers in Microbiology</p></fn>
</author-notes>
<pub-date pub-type="epub">
<day>20</day>
<month>03</month>
<year>2017</year>
</pub-date>
<pub-date pub-type="collection">
<year>2017</year>
</pub-date>
<volume>8</volume>
<elocation-id>443</elocation-id>
<history>
<date date-type="received">
<day>18</day>
<month>01</month>
<year>2017</year>
</date>
<date date-type="accepted">
<day>03</day>
<month>03</month>
<year>2017</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2017 Coluzzi, Gu&#x00E9;don, Devignes, Ambroset, Loux, Lacroix, Payot and Leblond-Bourget.</copyright-statement>
<copyright-year>2017</copyright-year>
<copyright-holder>Coluzzi, Gu&#x00E9;don, Devignes, Ambroset, Loux, Lacroix, Payot and Leblond-Bourget</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) or licensor are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<abstract>
<p>Recent analyses of bacterial genomes have shown that integrated elements that transfer by conjugation play an essential role in horizontal gene transfer. Among these elements, the integrative and mobilizable elements (IMEs) are known to encode their own excision and integration machinery, and to carry all the sequences or genes necessary to hijack the mating pore of a conjugative element for their own transfer. However, knowledge of their prevalence and diversity is still severely lacking. In this work, an extensive analysis of 124 genomes from 27 species of <italic>Streptococcus</italic> reveals 144 IMEs. These IMEs encode either tyrosine or serine integrases. The identification of IME boundaries shows that 141 are specifically integrated in 17 target sites. The IME-encoded relaxases belong to nine superfamilies, among which four are previously unknown in any mobilizable or conjugative element. A total of 118 IMEs are found to encode a non-canonical relaxase related to rolling circle replication initiators (belonging to the four novel families or to MobT). Surprisingly, among these, 83 encode a TcpA protein (i.e., a non-canonical coupling protein (CP) that is more closely related to FtsK than VirD4) that was not previously known to be encoded by mobilizable elements. Phylogenetic analyses reveal not only many integration/excision module replacements but also losses, acquisitions or replacements of TcpA genes between IMEs. This glimpse into the still poorly known world of IMEs reveals that mobilizable elements have a very high prevalence. Their diversity is even greater than expected, with most encoding a CP and/or a non-canonical relaxase.</p>
</abstract>
<kwd-group>
<kwd>mobilizable elements</kwd>
<kwd>relaxase</kwd>
<kwd>TcpA coupling protein</kwd>
<kwd>conjugation</kwd>
<kwd><italic>Streptococcus</italic></kwd>
</kwd-group>
<counts>
<fig-count count="5"/>
<table-count count="2"/>
<equation-count count="0"/>
<ref-count count="50"/>
<page-count count="16"/>
<word-count count="0"/>
</counts>
</article-meta>
</front>
<body>
<sec><title>Introduction</title>
<p>Conjugative elements drive horizontal gene transfer between bacteria, and therefore play a key role in bacterial evolution. These mobile elements encode all factors needed for their autonomous transfer by conjugation. The conjugative transfer of various plasmids from Gram-negative (G-) bacteria, especially proteobacteria, is well understood (<xref ref-type="bibr" rid="B11">Cabezon et al., 2015</xref>; <xref ref-type="bibr" rid="B13">Chandran Darbari and Waksman, 2015</xref>; <xref ref-type="bibr" rid="B25">Ilangovan et al., 2015</xref>) and proceeds as follows. The plasmid DNA is recognized and processed by the relaxosome, a complex that includes a relaxase protein encoded by the element. Up to now, six superfamilies of relaxases (MobC, MobF, MobH, MobP, MobQ, and MobV) are known to be encoded by conjugative plasmids from proteobacteria (<xref ref-type="bibr" rid="B17">Garcillan-Barcia et al., 2009</xref>) and are referred to in this paper as canonical relaxases. The relaxase catalyzes a site- and strand-specific cleavage of the origin of transfer (<italic>oriT</italic>) at the <italic>nic</italic> site of its cognate plasmid. The relaxase-tethered DNA is then recruited to the coupling protein (CP) belonging to the VirD4 family. The CP interacts with a multi-protein complex known as a type IV secretion system (T4SS) which spans the cellular envelope of the donor cell. The CP and T4SS subsequently translocate the single-strand DNA-relaxase complex through membranes and cell walls into the recipient cell. The nicking of <italic>oriT</italic> by the relaxase also initiates a rolling-circle replication (RCR) of the plasmid by cellular enzymes so that the donor cell retains the plasmid and the recipient cell acquires the plasmid. In addition to conjugative plasmids, other autonomous elements called integrative and conjugative elements (or ICEs) are found to be integrated in the chromosomes of bacteria. 
ICEs encode their own excision, transfer by conjugation, and integration (for reviews see <xref ref-type="bibr" rid="B10">Burrus et al., 2002</xref>; <xref ref-type="bibr" rid="B7">Bellanger et al., 2014</xref>). Apart from the excision and integration steps that are catalyzed by a tyrosine recombinase, a serine recombinase or a DDE transposase, the conjugative transfer of most ICEs is assumed to resemble that of plasmids of G- bacteria, and therefore to involve a relaxase, a CP and a T4SS machinery.</p>
<p>Many other mobile elements, known as mobilizable elements, hijack the conjugative machinery of unrelated conjugative elements (<xref ref-type="bibr" rid="B16">Francia et al., 2004</xref>; <xref ref-type="bibr" rid="B17">Garcillan-Barcia et al., 2009</xref>; <xref ref-type="bibr" rid="B33">Meyer, 2009</xref>). The best known mobilizable elements are the mobilizable plasmids from G- bacteria. While a very few mobilizable plasmids encode a CP, they never encode any other protein belonging to the T4SS. Almost all of them encode a relaxase from one of the six canonical superfamilies, but which is distantly related to those of the conjugative plasmids. These relaxases recognize and cut their cognate <italic>oriT</italic> (<xref ref-type="bibr" rid="B16">Francia et al., 2004</xref>; <xref ref-type="bibr" rid="B33">Meyer, 2009</xref>). They then recruit the CP and/or T4SS of a conjugative element to mobilize <italic>in trans</italic> the non-autonomous element. In addition to mobilizable plasmids, some integrative elements known as integrative and mobilizable elements (IMEs) also transfer by mobilization. IMEs encode their own excision and integration but carry only some of the sequences or genes necessary for their conjugative transfer (for a review, see <xref ref-type="bibr" rid="B7">Bellanger et al., 2014</xref>). Most of the very few IMEs described so far carry their own <italic>oriT</italic> and encode their own relaxase, but none encode a CP or any protein belonging to the T4SS. Other previously described IMEs carry their own <italic>oriT</italic> but do not encode any protein involved in conjugation. To date, very few genome searches have focused explicitly on IMEs so their prevalence and diversity are essentially unknown (<xref ref-type="bibr" rid="B9">Brochet et al., 2008</xref>; <xref ref-type="bibr" rid="B7">Bellanger et al., 2014</xref>). However, <xref ref-type="bibr" rid="B24">Guglielmini et al. 
(2011)</xref> performed an extensive search for relaxases and conjugation modules in 1124 archaeal and bacterial genomes, and identified many isolated relaxase genes on chromosomes, which suggests that IMEs are the most prevalent elements that transfer by conjugation.</p>
<p>While conjugation and mobilization mechanisms are well known in G- proteobacteria, they are poorly documented in all other bacterial clades, including the Firmicutes, a major group of Gram-positive (G+) bacteria. The conjugative plasmids and ICEs from firmicutes encode T4SSs belonging to two families, FA and FATA, that have not been found in G- bacteria (<xref ref-type="bibr" rid="B23">Guglielmini et al., 2014</xref>). The FATA T4SS was found to be associated with classical CPs (VirD4) and with relaxases belonging to the canonical MobP, MobQ, and MobC superfamilies (<xref ref-type="bibr" rid="B22">Guglielmini et al., 2013</xref>; <xref ref-type="bibr" rid="B3">Ambroset et al., 2016</xref>). In contrast, most plasmids and ICEs with FA T4SSs encode TcpA CPs instead of VirD4. The TcpA CPs are related to FtsK, the double strand DNA translocase involved in DNA segregation during cell division (<xref ref-type="bibr" rid="B22">Guglielmini et al., 2013</xref>; <xref ref-type="bibr" rid="B3">Ambroset et al., 2016</xref>). Furthermore, all the plasmids and ICEs that encode FA T4SSs and TcpA CPs encode non-canonical relaxases. Thus, the pCW3 conjugative plasmid from the Firmicute <italic>Clostridium perfringens</italic>, which encodes a FA T4SS and a TcpA CP, was recently shown to encode a novel type of relaxase related to tyrosine recombinase (<xref ref-type="bibr" rid="B50">Wisniewski et al., 2016</xref>). In the same way, all ICEs, which encode a FA T4SS and a TcpA CP, encode a relaxase belonging to the non-canonical MobT superfamily. The MobT relaxases are related to a family of RCR initiators involved in the intracellular replication and maintenance of small plasmids (<xref ref-type="bibr" rid="B22">Guglielmini et al., 2013</xref>; <xref ref-type="bibr" rid="B3">Ambroset et al., 2016</xref>). 
MobT encoded by ICE<italic>Bs1</italic> is involved in both conjugative transfer and in replication of the excised ICE [for a review, see (<xref ref-type="bibr" rid="B4">Auchtung et al., 2016</xref>)]. It should be mentioned that most families of relaxases involved in the RCR of small plasmids or viruses are clearly distinct from and perhaps unrelated to the superfamilies of relaxases found in conjugative and mobilizable elements. Besides the MobT relaxases encoded by the ICEs with FA T4SS and TcpA CP, the only other exception corresponds to PF01446 RCR initiators of some mobilizable plasmids of firmicutes that are involved in both plasmid replication and mobilization by ICEs encoding TcpA CPs (<xref ref-type="bibr" rid="B34">Naglich and Andrews, 1988</xref>; <xref ref-type="bibr" rid="B43">Showsh and Andrews, 1999</xref>; <xref ref-type="bibr" rid="B29">Lee et al., 2012</xref>).</p>
<p>Streptococci are G+ bacteria belonging to the Firmicutes. Genome and phylogenetic analyses have shown that a large proportion of the streptococcal genomes has experienced horizontal gene transfer (<xref ref-type="bibr" rid="B41">Richards et al., 2014</xref>). Previously, our extensive analyses of the genomes of 124 strains belonging to 27 streptococcal species revealed a high prevalence of ICEs (<xref ref-type="bibr" rid="B3">Ambroset et al., 2016</xref>), suggesting that a significant fraction of these transfers could be due to those elements. Furthermore, a comprehensive search of IMEs performed on eight available genomes of the firmicute <italic>Streptococcus agalactiae</italic> revealed twelve IMEs (<xref ref-type="bibr" rid="B9">Brochet et al., 2008</xref>). Surprisingly, this search also detected nine genomic islands which possess a complete integration/excision module and encode a putative CP belonging to the TcpA family, but which do not encode any proteins related to known relaxases. Therefore, these elements could correspond to IMEs encoding a relaxase that is very distantly related or unrelated to known relaxases. A preliminary reanalysis of these nine elements from <italic>S. agalactiae</italic> revealed that they encode proteins related to RCR initiators from plasmids or viruses, suggesting that these elements are probably IMEs encoding novel types of relaxases related to RCR initiators. In this study, we searched for IMEs in the 124 publicly available complete genomes of <italic>Streptococcus</italic> that were previously used for the ICE search. IMEs were defined by the combined presence of putative integrases and relaxases (related to classical relaxases or to RCR initiators), the possible presence of putative CPs (VirD4 or TcpA), and the absence of T4SSs. CDSs encoding these signature proteins were localized on the chromosomes, and the boundaries and integration sites of the IMEs were identified. 
This study (i) gives a general overview of the very high prevalence and diversity of putative IMEs within streptococci, (ii) identifies their numerous specific sites of insertion, (iii) reveals that most IMEs harbor a versatile and compact mobilization module that encodes a non-canonical relaxase related to RCR initiators and generally a non-canonical CP related to FtsK.</p>
</sec>
<sec id="s1" sec-type="materials|methods">
<title>Materials and Methods</title>
<sec><title>Genomes Examined and Database of Reference Proteins</title>
<p>The dataset of the 124 complete chromosomes from <italic>Streptococcus</italic> species available at the start of the present study was taken from Genbank<sup><xref ref-type="fn" rid="fn01">1</xref></sup>. The initial database of reference proteins contains signature proteins from ICEs and the few IMEs reported for Firmicutes in the literature. It includes protein sequences from 50 tyrosine integrases, 13 serine integrases, 2 DDE transposases, 50 relaxases, 37 CPs, and 26 VirB4 proteins (a T4SS ATPase). This last protein has never been found in any mobilizable elements and is used here as the main criterion for differentiating between ICEs and IMEs at the detection step.</p>
</sec>
<sec><title>Workflow</title>
<p>The overall workflow of our search strategy to detect and characterize ICEs in streptococcal chromosomes was described previously (<xref ref-type="bibr" rid="B3">Ambroset et al., 2016</xref>). This workflow allows (i) detecting ICEs from the presence of signature CDSs grouped on the genome, (ii) identifying ICE insertion sites and (iii) delineating ICEs. The workflow was adapted to IME detection by modifying the signature CDSs in step (i): a putative IME is detected when no VirB4 CDS is present and when an integrase CDS is found in the vicinity of a relaxase CDS. Steps (ii) and (iii) were conducted in the same way as for ICEs.</p>
<p>When an IME signature CDS was missing or incomplete (pseudogene), the corresponding complete CDS encoded by the closest known IME was taken and compared to the putative defective one by tBlastN in order to detect possible genome annotation errors (e.g., identification of an authentic gene as a pseudogene most frequently due to the presence of a type II intron within the gene or mis-identification of the &#x201C;start&#x201D; codon). Because before this work, the known IMEs did not encode a CP, those elements carrying an integrase gene, a relaxase gene, and a CP pseudogene were considered as IMEs. Moreover, our workflow detects elements containing only an integrase and a CP CDS but apparently no relaxase gene or pseudogene. In such cases, an exhaustive manual analysis was performed to search for new relaxase genes, in particular for genes encoding proteins related to RCR initiators. Newly found relaxases were added to the database of reference proteins and step (i) was reiterated on all genomes. In summary, we considered as IMEs all elements delimited by direct repeats and containing at least one CDS for one complete integrase as well as one complete relaxase, but no CDS for VirB4 or other proteins of the T4SS.</p>
</sec>
<sec><title>Denomination of IMEs</title>
<p>Each IME name indicates by letters and numbers the species and strain of the host bacteria. When an IME encodes a site-specific integrase, its denomination also specifies the name of the target gene. IMEs marked with an asterisk are not integrated in their primary site but in a secondary one as previously observed for ICEs (<xref ref-type="bibr" rid="B3">Ambroset et al., 2016</xref>).</p>
</sec>
<sec><title>Domain Composition Analysis and Tree Construction</title>
<p>The retrieval of the domain composition of all IME signature proteins from Uniprot annotations was done in batch using the BioMart Central Portal<sup><xref ref-type="fn" rid="fn02">2</xref></sup>. <italic>De novo</italic> conserved domain search (CD-search<sup><xref ref-type="fn" rid="fn03">3</xref></sup>) and/or PSI-Blast analyses were performed when no data was available through BioMart. The correspondence with Mob families was established using the CONJscan-T4SSscan program<sup><xref ref-type="fn" rid="fn04">4</xref></sup> (<xref ref-type="bibr" rid="B24">Guglielmini et al., 2011</xref>). This tool is no longer accessible but should soon be available on the Pasteur Galaxy server.</p>
<p>The signature proteins were aligned using Clustal omega with default parameters (<xref ref-type="bibr" rid="B44">Sievers et al., 2011</xref>). The trees of signature proteins were built with MEGA (<xref ref-type="bibr" rid="B46">Tamura et al., 2013</xref>) using (i) maximum likelihood (ML) based on the JTT (Jones&#x2013;Taylor&#x2013;Thornton) model including amino acid empirical frequencies (partial deletion of gaps and missing data at 80% cutoff, Gamma distribution in five categories, allowance for invariant sites), and (ii) BioNJ methods with the Poisson model (<xref ref-type="bibr" rid="B20">Gouy et al., 2010</xref>). The branch support of the groupings was estimated using bootstrap (100 replicates).</p>
</sec>
<sec><title>Protein Clustering and Signature Proteins Associations</title>
<p>Protein clustering at 90 and 40% sequence identity was performed using BLASTclust<sup><xref ref-type="fn" rid="fn05">5</xref></sup> (<xref ref-type="bibr" rid="B2">Alva et al., 2016</xref>) with default parameters. Circos<sup><xref ref-type="fn" rid="fn06">6</xref></sup> was used to visualize the signature protein associations (<xref ref-type="bibr" rid="B26">Krzywinski et al., 2009</xref>). The functional annotation of IMEs was performed using Agmial as described previously (<xref ref-type="bibr" rid="B3">Ambroset et al., 2016</xref>).</p>
</sec>
</sec>
<sec><title>Results</title>
<sec><title>Prevalence of IMEs within Streptococcal Chromosomes</title>
<p>The prevalence of IMEs was studied in a large set of species (27 <italic>Streptococcus</italic> species) and strains (<italic>n</italic> = 124). This exhaustive examination led to the identification of 144 IMEs. Their sizes ranged from 5 to 18 kb (Supplementary Table <xref ref-type="supplementary-material" rid="SM7">S1</xref>) except for IME_<italic>Sparas15912_rpsI</italic> which was 53 kb. The larger size of IME_<italic>Sparas15912_rpsI</italic> has likely resulted from a tandem ICE-IME insertion in the element. Within streptococcal genomes, this study showed that IME sizes (mean = 10 kb) were generally smaller than those of ICEs (mean = 41 kb). This difference is reminiscent of that observed between mobilizable and conjugative plasmids (<xref ref-type="bibr" rid="B45">Smillie et al., 2010</xref>).</p>
<p>Ten IMEs were found to be integrated in tandem accretion with other IMEs (IME1-IME2) or with ICEs (ICE-IME or ICE-IME1-IME2) (Supplementary Table <xref ref-type="supplementary-material" rid="SM7">S1</xref>) and many with decayed elements (data not shown). Nine tandems were found to be integrated in the 3&#x2032; end of <italic>rpsI</italic>, <italic>rpmG</italic>, or <italic>rplL</italic>. The last one was integrated in a secondary site inside IME_<italic>Sparas15912_rpsI.</italic> All IMEs in accretion in the same site had a tyrosine integrase but some decayed IMEs in accretion were found to encode serine integrases (data not shown). These integrases had from 21 to 69% sequence identity, showing that there was no particular relatedness between integrases encoded by elements in accretion.</p>
<p>More than half (<italic>n</italic> = 78) of the streptococcal chromosomes contained at least one IME. As seen in Supplementary Table <xref ref-type="supplementary-material" rid="SM7">S1</xref>, the occurrence of IMEs varied within species and strains. For instance, most of the 20 <italic>S. pyogenes</italic> chromosomes were devoid of IMEs, whereas the 3 <italic>S. anginosus</italic> chromosomes each contained from 4 to 6 IMEs. Interestingly, the genomes that contained the lowest numbers of IMEs (<italic>S. pyogenes</italic> with an average of 0.1 IME per genome) also contained few ICEs (0.1 ICE per genome). The opposite was also true; the genomes from <italic>S. anginosus</italic> were among those containing the highest numbers of IMEs (mean = 4.7) as well as ICEs (mean = 4.3).</p>
</sec>
<sec><title>Diversity of Integration Modules and Integration Sites of Streptococcal IMEs</title>
<p>Almost all of the integrase genes of streptococcal IMEs were located at one end of the element and were outward facing. These integrases belonged to two unrelated superfamilies: tyrosine integrases and serine integrases.</p>
<sec><title>Diversity of IME Tyrosine Integrases and of Their Integration Sites</title>
<p>Tyrosine integrases were detected in almost 89% of the IMEs (<italic>n</italic> = 128/144). Both phylogenetic analysis and clustering of the tyrosine integrases at 40% sequence identity allowed them to be classified in 10 distinct families (<bold>Figure <xref ref-type="fig" rid="F1">1</xref></bold>). In most cases, tyrosine integrases belonging to the same family catalyze integration in the same gene (<bold>Figures <xref ref-type="fig" rid="F1">1</xref></bold>, <bold><xref ref-type="fig" rid="F2">2</xref></bold>). For instance, all tyrosine integrases allocated to family Tyr_1 target the 3&#x2032; end of the tRNAleu gene. Three exceptions to this rule were observed. First, the Tyr_3 family includes tyrosine integrases targeting two distinct insertion genes (<italic>guaA</italic> or <italic>rplL</italic>). Phylogenetic analysis of these integrases suggests an evolution from <italic>guaA</italic> specificity to <italic>rplL</italic> specificity (<bold>Figure <xref ref-type="fig" rid="F1">1</xref></bold>). Second, the Tyr_4 family gathers all integrases targeting <italic>rpmE</italic> and one integrase targeting <italic>rpsI</italic>. Phylogenetic analysis of these integrases and the sister Tyr_5 group of integrases suggests an evolution from <italic>rpsI</italic> specificity to <italic>rpmE</italic> specificity. Third, integrases of family Tyr_8 catalyze integration within genes encoding four different tRNAs (tRNAasn, tRNAleu, tRNAlys, and tRNAarg). Although catalyzing integration in distinct tRNA genes, all integrases from family Tyr_8 share the ability to generate short direct repeats (DRs).</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption><p><bold>Phylogenetic tree of tyrosine integrases.</bold> One representative of each 90% protein identity cluster from integrative and mobilizable elements (IMEs) (in black) and one representative of each 90% protein identity cluster of tyrosine integrases from ICEs targeting the same site as IMEs (in mauve and underlined) are presented in the ML tree. Bootstrap values (BioNJ/ML) are given only when they exceed 50 for both analyses. The target gene is mentioned in the IME/ICE names. Tyrosine integrases sharing more than 40% sequence identity and therefore belonging to the same family are merged with brackets. These families are distinguished with different numbers. The DR length or integrase position is indicated to distinguish tyrosine integrases belonging to different families but targeting the same genes. Refer to Supplementary Table <xref ref-type="supplementary-material" rid="SM7">S1</xref> for IME and strain details.</p></caption>
<graphic xlink:href="fmicb-08-00443-g001.tif"/>
</fig>
<p>In the majority of cases, each insertion gene is specifically targeted by closely related tyrosine integrases grouped in one unique family (<bold>Figures <xref ref-type="fig" rid="F1">1</xref></bold>, <bold><xref ref-type="fig" rid="F2">2</xref></bold>). Exceptions were <italic>rpsI, rpmG</italic>, and the tRNAleu genes that are targeted by integrases belonging to several families. More specifically, <italic>rpsI</italic> is targeted by tyrosine integrases belonging to three distinct families; the integrases from families Tyr_4 and Tyr_5 lead to the formation of long DRs whereas those from family Tyr_7 all have short DRs (<bold>Figure <xref ref-type="fig" rid="F2">2</xref></bold>). Similarly, the integrases targeting the tRNAleu gene belong to two distinct families; the integrases from family Tyr_1 have long DRs, and those from family Tyr_8 have short DRs. Finally, two families of integrases catalyze integration in <italic>rpmG</italic> and lead to two distinct architectures after integration: genes encoding integrases from family Tyr_10 are adjacent to <italic>rpmG</italic>, whereas those encoding integrases from family Tyr_6 are at the opposite end of the IME.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption><p><bold>Integrative and mobilizable element integration loci and their position relative to the integrase CDSs.</bold> Tyrosine and serine integrase genes are shown in red and green, respectively. The target genes (dark blue) encode, respectively: <italic>ebfC</italic> [nucleoid associated protein], <italic>guaA</italic> [GMP synthase], <italic>maff2</italic> [conserved membrane protein of ICEs belonging to Tn<italic>5252</italic> superfamily], <italic>rpsI</italic> [S9 ribosomal protein], <italic>rplL</italic> [L7/L12 ribosomal protein]<italic>, rpmE</italic> [L31 ribosomal protein], <italic>rpmG</italic> [L33 ribosomal protein]<italic>, rumA</italic> [23S rRNA (uracil-5-) methyltransferase], <italic>snf2</italic> [helicase of ICEs belonging to Tn<italic>5252</italic> superfamily], <italic>tatD</italic> [DNAse], <italic>traG</italic> [VirD4 CP gene from ICEs belonging to Tn<italic>5252</italic> superfamily]. The DR size (in bp) within the target gene is indicated in blue and the one outside is in red. The number of IMEs integrated in a given site is marked at the bottom of each box.</p></caption>
<graphic xlink:href="fmicb-08-00443-g002.tif"/>
</fig>
<p>In summary, the analysis of the integration loci of 128 IMEs harboring a tyrosine integrase shows that these integrases specifically target 11 distinct genes, mainly (109/128) at the 3&#x2032; end of genes encoding tRNAs or ribosomal proteins. More rarely (19/128), tyrosine integrases from IMEs catalyze integration at the 3&#x2032; or 5&#x2032; end of other protein-encoding genes (<italic>guaA</italic>, <italic>tatD</italic>, or <italic>ebfC</italic>). This study has therefore extended the known list of possible integration sites for streptococcal IMEs with tyrosine integrases: only four integration sites were previously identified (<italic>oriT</italic> from ICEs belonging to Tn<italic>916</italic> and ICE<italic>St3</italic> families, 3&#x2032; <italic>rpsI</italic>, 3&#x2032; tRNALys gene and 3&#x2032; <italic>rpmG</italic>) (<xref ref-type="bibr" rid="B9">Brochet et al., 2008</xref>; <xref ref-type="bibr" rid="B38">Puymege et al., 2015</xref>; <xref ref-type="bibr" rid="B30">Lorenzo-Diaz et al., 2016</xref>).</p>
</sec>
<sec><title>Diversity of IME Serine Integrases and of Their Integration Sites</title>
<p>Our collection of IMEs contains 16 IMEs encoding a serine integrase. For two IMEs (IME_<italic>Sol3089_ND</italic> and IME_<italic>SsalCCHSS3_ND</italic>) encoding related integrases belonging to family Ser_2, we were unable to determine the specificity of integration because these two IMEs were integrated in two distinct intergenic regions (<bold>Figure <xref ref-type="fig" rid="F2">2</xref></bold>). Two other IMEs with serine integrases were found to be integrated within the bacterial gene <italic>rumA</italic>, which is already known to be a common integration site for ICEs with serine integrases (<xref ref-type="bibr" rid="B3">Ambroset et al., 2016</xref>). All other 12 IMEs were found to be integrated within conserved genes from ICEs belonging to the Tn<italic>5252</italic> superfamily: <italic>traG</italic> (encoding a VirD4 CP), <italic>maff2</italic> (encoding a membrane protein), and <italic>snf2</italic> (encoding a helicase) (Supplementary Table <xref ref-type="supplementary-material" rid="SM7">S1</xref>), thereby leading to gene disruption.</p>
<p>Both phylogenetic analysis and 40% sequence identity clustering of the serine integrases indicate that they may be classified in four distinct families (Ser_1 to 4, <bold>Supplementary Figure <xref ref-type="supplementary-material" rid="SM1">S1</xref></bold>). A large majority of the serine integrases sharing the same integration specificity were grouped in the same family. For example, the integrases targeting the <italic>traG</italic>, <italic>snf2</italic>, and <italic>rumA</italic> genes were grouped in families Ser_1, Ser_3, and Ser_4, respectively. Exceptions were the two serine integrases targeting <italic>maff2</italic> that were found in two distinct families: the one belonging to family Ser_1 shows a close relatedness with integrases targeting <italic>traG</italic>, whereas the one belonging to family Ser_3 is related to integrases targeting <italic>snf2</italic>. These two integrases catalyze integration in two different locations within <italic>maff2</italic> and lead to the generation of distinct DRs (<bold>Figure <xref ref-type="fig" rid="F2">2</xref></bold>). This variability of integration within the same gene was also observed for integration inside <italic>traG</italic>. The two IMEs specific to <italic>snf2</italic> are integrated in the same location within <italic>snf2</italic>, but the recombination site of the IME is located within the integrase gene for IME_<italic>Spy2096_SNF2</italic>, whereas it is adjacent to the 3&#x2032; end of the integrase gene for IME_<italic>SsuT15_SNF2</italic> (<bold>Figure <xref ref-type="fig" rid="F2">2</xref></bold>).</p>
</sec>
<sec><title>Comparison of the Recombination Modules of IMEs and ICEs</title>
<p>Our collection of IMEs (this work) and ICEs (<xref ref-type="bibr" rid="B3">Ambroset et al., 2016</xref>) from streptococci allowed us to compare the recombination modules of these two types of element. Both of them encode serine and tyrosine integrases, and their diversity is similar in IMEs and in ICEs. Indeed, we detected 18 distinct specificities for integrases from streptococcal IMEs (17 targeting a specific site and one with unknown specificity) and at least 17 for the ICEs. However, in contrast to the ICEs, no DDE transposase was found in any of the IMEs.</p>
<p>As shown in <bold>Figure <xref ref-type="fig" rid="F1">1</xref></bold> and <bold>Supplementary Figure <xref ref-type="supplementary-material" rid="SM1">S1</xref></bold>, several integrase families (such as Tyr_2, Tyr_3, Tyr_5, Tyr_6, Tyr_8, Tyr_10, and Ser_4) grouped integrases from both IMEs and ICEs. For three specificities: <italic>ebfC</italic> (Tyr_2), <italic>rplL</italic> (Tyr_3), and <italic>rpmG</italic> opposite (Tyr_6), tyrosine integrases from IMEs and ICEs belong to closely related sister groups. In family Tyr_5, the tyrosine integrases from IMEs targeting <italic>rpsI</italic> are mixed with those of the ICEs, and in cluster Ser_4 the serine integrase targeting <italic>rumA</italic> from IME<italic>_SpnAP200_rumA</italic> shares 91&#x2013;93% identity with those of two ICEs. Altogether, these results suggest that exchanges of integration modules between ICEs and IMEs are frequent.</p>
</sec>
</sec>
<sec><title>New Relaxase Families Related to RCR Initiator Proteins in IMEs</title>
<p>A total of 154 relaxase genes were detected within IMEs (including three pseudogenes in IMEs harboring two relaxases). Based on their domain composition, the relaxases were classified in nine distinct superfamilies (<bold>Table <xref ref-type="table" rid="T1">1</xref></bold>). Among the four most prevalent relaxase superfamilies, only the Rel_PF02486 superfamily was recognized by the CONJscan-T4SSscan analysis as belonging to a known type of relaxase (MobT). The three others were novel superfamilies of relaxases characterized by the following domains: PF01719 (Rel_PF01719), PHA00330 (Rel_PHA00330) and by the combination of PF01719 and PF00910 (Rel_PF01719-PF00910). The Rel_PF02407 superfamily was the fourth novel superfamily identified in this study. All these new relaxase superfamilies discovered in IMEs harbored domains (PF01719, PHA00330, or PF02407) that were previously found exclusively in RCR initiators from viruses or plasmids (<xref ref-type="bibr" rid="B15">Ebisu et al., 1995</xref>; <xref ref-type="bibr" rid="B5">Bachrach et al., 2004</xref>; <xref ref-type="bibr" rid="B18">Gibbs et al., 2006</xref>; <xref ref-type="bibr" rid="B31">Lorenzo-Diaz et al., 2014</xref>). They were assumed to correspond to novel relaxase superfamilies since all these proteins were associated with an integrase and a large majority of these non-canonical relaxases (or all for PF02407) were associated with a CP in our IME collection. Four other relaxase superfamilies described in <bold>Table <xref ref-type="table" rid="T1">1</xref></bold> (Rel_PF03389, Rel_PF01076, Rel_PF13814, and Rel_PF03432) were recognized by the CONJscan-T4SSscan server as the MobQ, MobV, MobC, and MobP superfamilies, respectively.</p>
<table-wrap position="float" id="T1">
<label>Table 1</label>
<caption><p>Relaxase superfamilies based on domain composition.</p></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<th valign="top" align="left">Superfamily name</th>
<th valign="top" align="center">Domain(s) ID<sup>&#x2217;</sup></th>
<th valign="top" align="center">Domain name(s)</th>
<th valign="top" align="center">Conjscan domain</th>
<th valign="top" align="center">Number found</th>
<th valign="top" align="center">Number of clusters</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Rel_PF02486/MobT</td>
<td valign="top" align="center">PF02486</td>
<td valign="top" align="center">Rep_trans</td>
<td valign="top" align="center">MobT</td>
<td valign="top" align="center">55</td>
<td valign="top" align="center">6</td>
</tr>
<tr>
<td valign="top" align="left">Rel_PF01719</td>
<td valign="top" align="center">PF01719</td>
<td valign="top" align="center">Rep_2</td>
<td valign="top" align="center">No hit</td>
<td valign="top" align="center">35</td>
<td valign="top" align="center">1</td>
</tr>
<tr>
<td valign="top" align="left">Rel_PHA00330</td>
<td valign="top" align="center">PHA00330</td>
<td valign="top" align="center">Not applicable</td>
<td valign="top" align="center">No hit</td>
<td valign="top" align="center">21</td>
<td valign="top" align="center">3</td>
</tr>
<tr>
<td valign="top" align="left">Rel_PF01719-PF00910</td>
<td valign="top" align="center">PF01719 + PF00910</td>
<td valign="top" align="center">Rep_2 + RNA_helicase</td>
<td valign="top" align="center">No hit</td>
<td valign="top" align="center">15</td>
<td valign="top" align="center">4</td>
</tr>
<tr>
<td valign="top" align="left">Rel_PF03389/MobQ</td>
<td valign="top" align="center">PF03389</td>
<td valign="top" align="center">MobA_MobL</td>
<td valign="top" align="center">MobQ</td>
<td valign="top" align="center">12</td>
<td valign="top" align="center">1</td>
</tr>
<tr>
<td valign="top" align="left">Rel_PF01076/MobV</td>
<td valign="top" align="center">PF01076</td>
<td valign="top" align="center">Mob_Pre</td>
<td valign="top" align="center">MobV</td>
<td valign="top" align="center">11</td>
<td valign="top" align="center">2</td>
</tr>
<tr>
<td valign="top" align="left">Rel_PF02407</td>
<td valign="top" align="center">PF02407</td>
<td valign="top" align="center">Viral-Rep</td>
<td valign="top" align="center">No hit</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">1</td>
</tr>
<tr>
<td valign="top" align="left">Rel_PF13814/MobC</td>
<td valign="top" align="center">PF13814</td>
<td valign="top" align="center">Replic_Relax</td>
<td valign="top" align="center">MobC</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">1</td>
</tr>
<tr>
<td valign="top" align="left">Rel_PF03432/MobP</td>
<td valign="top" align="center">PF03432</td>
<td valign="top" align="center">Relaxase</td>
<td valign="top" align="center">MobP</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">1</td></tr>
</tbody>
</table>
<table-wrap-foot>
<attrib><italic><sup>&#x2217;</sup>All domains are described in the Pfam classification except for domain PHA00330 that was found in the NCBI Conserved Domain classification without any Pfam equivalent.</italic></attrib>
</table-wrap-foot>
</table-wrap>
<p>On the basis of their relaxase content, the IMEs were grouped in nine classes (IME_Class_1 to 9) encoding a unique relaxase, one for each superfamily of relaxase (<bold>Table <xref ref-type="table" rid="T2">2</xref></bold>). An additional class (IME_Class_10) contained 10 IMEs that carry 2 relaxases: one belonging to the Rel_PF02486/MobT and the other to the Rel_PF01076/MobV. Each of the two relaxase superfamilies present in this class also exists as standalone relaxases in IME_Class_1 and IME_Class_6.</p>
<table-wrap position="float" id="T2">
<label>Table 2</label>
<caption><p>Diversity of the relaxases and CPs associated with serine and tyrosine integrases.</p></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<th valign="top" align="left">Integrase type (number)</th>
<th valign="top" align="center">Relaxase superfamily (number)</th>
<th valign="top" align="center">CP superfamily (number)</th>
<th valign="top" align="center">IME class</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Tyrosine integrase (128)</td>
<td valign="top" align="center">Rel_IME_1/MobT (45)</td>
<td valign="top" align="center">TcpA (24) or none (21)</td>
<td valign="top" align="center">Class_IME_1</td>
</tr>
<tr>
<td valign="top" align="left"></td>
<td valign="top" align="center">Rel_IME_2 (35)</td>
<td valign="top" align="center">TcpA (34<sup>&#x2217;</sup>) or none (1)</td>
<td valign="top" align="center">Class_IME_2</td>
</tr>
<tr>
<td valign="top" align="left"></td>
<td valign="top" align="center">Rel_IME_3 (21)</td>
<td valign="top" align="center">TcpA (19<sup>&#x2217;</sup>) or none (2)</td>
<td valign="top" align="center">Class_IME_3</td>
</tr>
<tr>
<td valign="top" align="left"></td>
<td valign="top" align="center">Rel_IME_4 (15)</td>
<td valign="top" align="center">TcpA (4) or none (11)</td>
<td valign="top" align="center">Class_IME_4</td>
</tr>
<tr>
<td valign="top" align="left"></td>
<td valign="top" align="center">Rel_IME_1/MobT (10<sup>&#x2217;</sup>) + Rel_IME_6/MobV (10<sup>&#x2217;</sup>)</td>
<td valign="top" align="center">None</td>
<td valign="top" align="center">Class_IME_10</td>
</tr>
<tr>
<td valign="top" align="left"></td>
<td valign="top" align="center">Rel_IME_7 (2)</td>
<td valign="top" align="center">TcpA (2)</td>
<td valign="top" align="center">Class_IME_7</td>
</tr>
<tr>
<td valign="top" align="left">Serine integrases (16)</td>
<td valign="top" align="center">Rel_IME_5/MobQ (12)</td>
<td valign="top" align="center">None</td>
<td valign="top" align="center">Class_IME_5</td>
</tr>
<tr>
<td valign="top" align="left"></td>
<td valign="top" align="center">Rel_IME_8/MobC (2)</td>
<td valign="top" align="center">VirD4 (2)</td>
<td valign="top" align="center">Class_IME_8</td>
</tr>
<tr>
<td valign="top" align="left"></td>
<td valign="top" align="center">Rel_IME_6/MobV (1)</td>
<td valign="top" align="center">None</td>
<td valign="top" align="center">Class_IME_6</td>
</tr>
<tr>
<td valign="top" align="left"></td>
<td valign="top" align="center">Rel_IME_9/MobP (1)</td>
<td valign="top" align="center">None</td>
<td valign="top" align="center">Class_IME_9</td></tr>
</tbody>
</table>
<table-wrap-foot>
<attrib><italic><sup>&#x2217;</sup>Number includes pseudogenes.</italic></attrib>
</table-wrap-foot>
</table-wrap>
<p>Within each superfamily of relaxases, the diversity was estimated by phylogenetic analyses and 40% sequence identity clustering. The most abundant superfamily, Rel_PF02486/MobT (<bold>Supplementary Figure <xref ref-type="supplementary-material" rid="SM2">S2</xref></bold>), includes six families (Rel_PF02486_1 to 6), among which the family PF02486_3 was associated with a Rel_PF01076/MobV in IME_Class_10. In contrast, the 35 relaxases from the Rel_PF01719 superfamily are closely related and were therefore clustered in a unique family (<bold>Supplementary Figure <xref ref-type="supplementary-material" rid="SM3">S3</xref></bold>). The same was true for the 12 relaxases of the Rel_PF03389/MobQ superfamily (data not shown). The 21 members of the Rel_PHA00330 superfamily were grouped into three families (<bold>Supplementary Figure <xref ref-type="supplementary-material" rid="SM4">S4</xref></bold>), and the Rel_PF01719-PF00910 superfamily (15 members) analysis yielded four families (<bold>Supplementary Figure <xref ref-type="supplementary-material" rid="SM5">S5</xref></bold>). Finally, the superfamily Rel_PF01076 was clustered in two families, with the Rel_PF01076_1 being always found in IME_Class_10. Overall, the IME relaxases showed a great diversity: they were classified in nine distinct superfamilies subdivided in 20 families (<bold>Table <xref ref-type="table" rid="T1">1</xref></bold>). It should be noted that the diversity of IME relaxases largely exceeds that of ICEs, since ICEs are classified in three superfamilies/eight families according to the same criteria (<xref ref-type="bibr" rid="B3">Ambroset et al., 2016</xref>). Only two superfamilies of relaxases corresponding to Rel_PF02486/MobT and Rel_PF03432/MobP are encoded by both IMEs and ICEs. However, our analysis showed that within these superfamilies, the relaxases of IMEs always belong to clearly distinct families from those including ICE relaxases. 
Moreover, whereas the numbers of Rel_PF02486/MobT relaxases found for ICEs and IMEs are similar, it should be stressed that Rel_PF03432/MobP relaxases constitute the most abundant superfamily in ICEs (62/105 relaxases) and the least abundant in IMEs (only 1/154 relaxases).</p>
</sec>
<sec><title>Half of the Streptococcal IMEs Encode a CP</title>
<p>Prior to the present study, none of the previously known or predicted IMEs was found to encode a CP (<xref ref-type="bibr" rid="B7">Bellanger et al., 2014</xref>), and the few CPs that are known to be encoded by mobilizable plasmids belong to the VirD4 superfamily (<xref ref-type="bibr" rid="B17">Garcillan-Barcia et al., 2009</xref>). Surprisingly, our results show that more than half of the streptococcal IMEs encode a CP (85/144 including 11 pseudogenes of CP) and that almost all these CPs do not belong to the canonical VirD4 family. Indeed, only two IMEs encode a VirD4 CP characterized by a C-terminal VirD4 domain (COG3505 in the NCBI CDD classification). All others (72 proteins excluding pseudogenes) were found to display a unique PF01580 &#x201C;FtsK-SpoIIIE&#x201D; catalytic domain and to be more closely related to FtsK (a DNA translocase involved in DNA segregation during cell division) than to the canonical VirD4. According to the CONJscan-T4SSscan analysis, these proteins belong to a particular superfamily of CP named TcpA, found only in Firmicutes (<xref ref-type="bibr" rid="B22">Guglielmini et al., 2013</xref>). Reconstruction of their phylogeny and 40% identity clustering allowed their classification in 12 distinct families designated TcpA_1 to TcpA_12 (<bold>Supplementary Figure <xref ref-type="supplementary-material" rid="SM6">S6</xref></bold>). The three most abundant families, TcpA_4, TcpA_7, and TcpA_12, contained 11, 11, and 30 proteins, respectively. The nine others were each found in only 1 to 6 IMEs.</p>
<p>The two superfamilies (VirD4 and TcpA) of CPs were found in both ICEs (<xref ref-type="bibr" rid="B3">Ambroset et al., 2016</xref>) and IMEs with different prevalence. Within <italic>Streptococcus</italic> genomes, VirD4 CPs are encoded by 61/105 ICEs and by only the 2 IMEs belonging to IME_Class_8. In contrast, TcpA CPs are encoded by 44/105 ICEs (belonging to the Tn<italic>916</italic> superfamily) and 83/144 IMEs (belonging to class_1 to 4 and to class_7). Moreover, the diversity of TcpA CPs in IMEs is much larger than in ICEs (12 vs. 3 distinct families) which is reminiscent of relaxases (see above).</p>
</sec>
<sec><title>High Diversity of Association of the Different Classes of Signature Genes within IMEs</title>
<p>Our analysis of the co-occurrence of relaxase superfamilies, CPs, and integrases in IMEs reveals some mandatory associations, consistent with the classification defined in section &#x201C;New Relaxase Families Related to RCR Initiator Proteins in IMEs&#x201D; (<bold>Table <xref ref-type="table" rid="T2">2</xref></bold>). Tyrosine integrases were found in all IMEs encoding non-canonical relaxases related to RCR initiators, i.e., (i) a Rel_PF02486/MobT relaxase or (ii) relaxases from the four new superfamilies identified in this study. On the other hand, serine integrases were found in all IMEs encoding a relaxase from the canonical Rel_PF03389/MobQ, Rel_PF13814/MobC, Rel_PF01076/MobV (in the absence of a Rel_PF02486/MobT relaxase) and Rel_PF03432/MobP superfamilies. Furthermore, IMEs encoding a single Rel_PF02486/MobT or a relaxase belonging to one of the four new superfamilies also encode either TcpA or no CP. TcpA CPs were never found in IMEs containing one of the canonical relaxases (Rel_PF03389/MobQ, Rel_PF13814/MobC, Rel_PF01076/MobV (alone or with Rel_PF02486/MobT) and Rel_PF03432/MobP). These IMEs contain either no CPs (MobQ, MobV, and MobP) or CPs from the VirD4 superfamily (MobC).</p>
<p>An illustration of all possible ternary Integrase&#x2013;Relaxase&#x2013;CP associations in our collection of 144 IMEs is shown in <bold>Figure <xref ref-type="fig" rid="F3">3</xref></bold>. For each type of signature protein, the families identified by phylogenetic analyses and clustering at 40% identity are represented by arcs on the circle. The numbers of members in each family are reported in black. The numbers of clusters of sequences sharing more than 90% identity are reported in gray on each arc in order to estimate the sequence diversity in each family of signature protein. Apart from signature protein families with few representatives (<italic>n</italic> &#x003C; 3) or with low diversity (90% identity clusters &#x003C;3), this analysis of the co-occurrence of the different families of integrases, CPs, and relaxases (<bold>Figure <xref ref-type="fig" rid="F3">3</xref></bold>) reveals no exclusive associations. Altogether, 39 different ternary associations were observed suggesting a high frequency of shuffling between signature proteins.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption><p><bold>Co-occurrence of relaxases, CPs and integrases among IMEs.</bold> Arcs group proteins belonging to the same family according to phylogenetic analysis and 40% sequence identity clustering: red, green, and blue arcs for clustered integrases, relaxases, and CPs, respectively. Ribbons indicate the association between integrases and relaxases in red, relaxases and CPs in green and CPs and integrases in blue. Numbers in black show the number of IMEs belonging to the same family. Numbers in gray show the number of 90% sequence identity clusters within the family.</p></caption>
<graphic xlink:href="fmicb-08-00443-g003.tif"/>
</fig>
</sec>
<sec><title>Organization of Conserved CDSs in IMEs: Predominance of a Common Compact Structure</title>
<p>For a better characterization of the IMEs, a search for conserved CDSs in IMEs encoding the same superfamily of relaxases was undertaken. The various conserved CDS architectures are schematized in <bold>Figure <xref ref-type="fig" rid="F4">4</xref></bold>. Apart from IME_Class_10, the IMEs with a tyrosine integrase encode a unique non-canonical relaxase (Rel_PF02486/MobT, Rel_PF01719, Rel_PHA00330, Rel_PF01719-PF00910, and Rel_PF02407). These IMEs display a compact structure composed of successive genes (relaxase, excisionase, and integrase), generally preceded by a TcpA gene (83/118). Interestingly, the same compact structure was found in IME_Class_8, even if the encoded proteins are not related (a VirD4 CP instead of a TcpA CP, a canonical Rel_PF13814/MobC relaxase instead of a relaxase related to RCR initiators and a serine integrase instead of a tyrosine integrase).</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption><p><bold>Conserved CDS architectures within IMEs.</bold> The classification of IMEs is based on their relaxase content (see also <bold>Table <xref ref-type="table" rid="T2">2</xref></bold>). The genes encoding conserved proteins in all IMEs sharing the same relaxase superfamily are indicated by arrows. The genes between brackets correspond to non-conserved genes located between conserved ones. The numerical values show the numbers of IMEs sharing the same structure.</p></caption>
<graphic xlink:href="fmicb-08-00443-g004.tif"/>
</fig>
<p>All other classes of IMEs encode other types of canonical relaxases and do not encode a CP. In IME_Class_10, the two genes encoding relaxases (a canonical Rel_PF01076/MobV and a non-canonical Rel_PF02486/MobT) are located far upstream of the tyrosine integrase gene in the opposite orientation. As well as the two relaxases and a tyrosine integrase, these IMEs encode a protein with a repA_N domain that is also found in proteins that initiate the theta replication of plasmids and of ICEs belonging to the Tn<italic>5252</italic> superfamily from firmicutes (<xref ref-type="bibr" rid="B49">Weaver et al., 2009</xref>; <xref ref-type="bibr" rid="B21">Guerillot et al., 2013</xref>; <xref ref-type="bibr" rid="B3">Ambroset et al., 2016</xref>). However, repA_N proteins from IMEs are shorter (&#x223C;100 amino acids) than those found in plasmids and ICEs (&#x223C;340 amino acids), suggesting that they probably serve a different function.</p>
<p>Apart from IME_Class_8, all IMEs encoding a serine integrase and relaxases from canonical superfamilies (Rel_PF03389/MobQ, Rel_PF01076/MobV, and Rel_PF03432/MobP) also encode one or several proteins that could be involved in the maintenance of the excised elements. These proteins include homologs to: (i) &#x2018;replisome organizers&#x2019; or &#x2018;DnaC-related&#x2019; proteins involved in the initiation of theta replication of various phages from Firmicutes such as phi5218, phi4268, or phi9871 (<xref ref-type="bibr" rid="B48">Trotter et al., 2006</xref>; <xref ref-type="bibr" rid="B47">Tang et al., 2013</xref>; <xref ref-type="bibr" rid="B32">McDonnell et al., 2016</xref>), (ii) &#x2018;ParB&#x2019; proteins involved in chromosome and plasmid partitioning (domain TIGR00180) (<bold>Figure <xref ref-type="fig" rid="F4">4</xref></bold>). Such proteins are not encoded by any other class of IMEs analyzed in this study.</p>
<p>In summary, whereas the analysis of IME signature proteins shows a remarkable diversity, preventing their classification on the basis of their relationships, the analysis of their CDS organization shows that most of them (IME_Class_1, _2, _3, _4, _7, and _8, representing 120/144 IMEs) harbor a similar compact organization. This conserved compact organization was observed for all the IMEs encoding a single relaxase related to RCR initiators (Rel_PF02486/MobT type and four other new superfamilies discovered in this study) and for all IMEs encoding a CP (TcpA or VirD4).</p>
</sec>
<sec><title>Modular Evolution of IMEs</title>
<p>Sequence comparison of IMEs suggests that most of the exchanges of modules or CP-encoding genes occur between IMEs with similar structures, especially between elements harboring the compact structure described above. <bold>Figure <xref ref-type="fig" rid="F5">5</xref></bold> illustrates two such situations involving IME_Class_2 and IME_Class_7 (<bold>Figure <xref ref-type="fig" rid="F5">5A</xref></bold>), and IME_Class_3 and IME_Class_1 (<bold>Figure <xref ref-type="fig" rid="F5">5B</xref></bold>). In the first example, two members of IME_Class_2 (named here IME_<italic>A1</italic> and IME_<italic>A2</italic> for simplicity), exhibit a closely related mobilization module but their integration/excision modules are very different. Moreover, the integration module of IME_<italic>A2</italic> is related to that of IME_<italic>A3</italic> (from IME_Class_7) suggesting a probable exchange of integration modules between IMEs. In the second example, IME_<italic>B2</italic> and IME_<italic>B3</italic> (from IME_Class_1) have related integration and mobilization modules with the exception of their CP. However, the TcpA encoded by IME_<italic>B2</italic> is related to the one encoded by IME_<italic>B1</italic> (from IME_Class_3). These data point to an exchange of genes encoding TcpA CPs between IMEs encoding different types of relaxases and integrases.</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption><p><bold>Modular evolution of IMEs. (A)</bold> Sequence comparison of IME_<italic>A2</italic> with IME_<italic>A1</italic> and IME_<italic>A3</italic>. <bold>(B)</bold> Sequence comparison of IME_<italic>B2</italic> with IME_<italic>B1</italic> and IME_<italic>B3</italic>. Percentages of nucleic identities are shown in gray. Blue: genes encoding conserved proteins of the mobilization module. Red or pink: genes encoding conserved proteins of integration/excision module. Orange: other genes. IME_<italic>A1</italic> = IME_<italic>SdyRE378_rpsI</italic>, IME_<italic>A2</italic> = IME_<italic>SanC238_rpmG, IME_A3</italic> = IME_<italic>Sag201008_rpmG</italic>, IME_<italic>B1</italic> = IME_<italic>Spas43144_rpsI</italic>, IME_<italic>B2</italic> = IME_<italic>SanMAS624_tRNAlys and</italic> IME_<italic>B3</italic> = IME_<italic>SpnOXC141_rpmG.</italic></p></caption>
<graphic xlink:href="fmicb-08-00443-g005.tif"/>
</fig>
</sec>
</sec>
<sec><title>Discussion</title>
<sec><title>Prevalence and Diversity of IMEs</title>
<p>Integrative and mobilizable elements are by far the least known elements that transfer by conjugation. Indeed, until now, very little information on their prevalence has been available. Considering their diversity, very few IMEs with different mobilization and/or recombination modules have been reported (only 15 in 2013, see <xref ref-type="bibr" rid="B7">Bellanger et al., 2014</xref> for a review). Here, we identified all IMEs carried by 124 genomes from 27 species of <italic>Streptococcus</italic> and compared their abundance and diversity to those of ICEs previously identified in the same set of strains (<xref ref-type="bibr" rid="B3">Ambroset et al., 2016</xref>). We demonstrated that IMEs have a very high prevalence and are about 40% more abundant than ICEs. We also found that the mobilization modules of IMEs display a larger diversity than the conjugation modules of ICEs.</p>
<p>Only 20% of our collection of streptococcal IMEs encode canonical relaxases (i.e., belong to the Rel_PF03389/MobQ, Rel_PF01076/MobV, Rel_PF13814/MobC, or Rel_PF03432/MobP superfamilies), already found to be encoded by conjugative and mobilizable elements from G- bacteria (<xref ref-type="bibr" rid="B17">Garcillan-Barcia et al., 2009</xref>). Among them, none encode any CP (IME_Class_5, _6, and _9) except the two IMEs with a Rel_PF13814/MobC relaxase (IME_Class_8) that encode a canonical VirD4 CP. This is reminiscent of mobilizable plasmids of G- bacteria and firmicutes (<xref ref-type="bibr" rid="B17">Garcillan-Barcia et al., 2009</xref>).</p>
<p>Unexpectedly, the large majority (90%, <italic>n</italic> = 129/144) of streptococcal IMEs in our collection encode non-canonical relaxases (Rel_PF02486/MobT, Rel_PF01719, Rel_PHA00330, Rel_PF01719-PF00910, and Rel_PF02407) related to proteins responsible for RCR initiation involved in the maintenance of plasmids from firmicutes or viruses. MobT was previously identified in a few predicted IMEs (<xref ref-type="bibr" rid="B7">Bellanger et al., 2014</xref>) and in ICEs belonging to the Tn<italic>916</italic> superfamily (<xref ref-type="bibr" rid="B3">Ambroset et al., 2016</xref>). The four other superfamilies of putative relaxases are unrelated to any known relaxase of mobilizable or conjugative elements. It should be emphasized that the MobT &#x201C;relaxase&#x201D; of the integrative and conjugative element ICE<italic>Bs1</italic> from the firmicute <italic>Bacillus subtilis</italic> is involved in not only the initiation of the conjugative transfer of ICE<italic>Bs1</italic> but also the initiation of RCR needed for the maintenance of ICE<italic>Bs1</italic> after excision (<xref ref-type="bibr" rid="B28">Lee et al., 2010</xref>). In the same way, another family of &#x201C;RCR initiators&#x201D; exhibiting a Rep_1/PF01446 domain is involved not only in the maintenance of three plasmids from firmicutes but also in their mobilization by ICE<italic>Bs1</italic> (<xref ref-type="bibr" rid="B29">Lee et al., 2012</xref>). Therefore, the classical distinction between RCR initiators and relaxases could lose its relevance. In IMEs encoding a CP (<italic>n</italic> = 85/144), RCR initiator-related relaxases are always associated with a non-canonical TcpA CP. 
The strict association of RCR initiator and TcpA is also observed in conjugative elements encoding a RCR relaxase (i.e., the ICEs belonging to the Tn<italic>916/</italic>ICE<italic>Bs1</italic>/ICE<italic>St3</italic> from firmicutes) (<xref ref-type="bibr" rid="B22">Guglielmini et al., 2013</xref>; <xref ref-type="bibr" rid="B3">Ambroset et al., 2016</xref>). In these IMEs and ICEs, the <italic>tcpA</italic> gene is located upstream from the RCR &#x201C;relaxase&#x201D; gene. Taken together, these findings reveal that non-canonical relaxases related to four types of RCR initiators and non-canonical CPs related to FtsK DNA translocase are involved in the mobilization of most streptococcal IMEs.</p>
<p>FtsK-related proteins were previously found to be encoded by various small plasmids mainly from firmicutes (see for example, NCBI reference sequences NP_203541, NP_613077, YP_251910, WP_011669127, YP_001967631, YP_006939188) but they were never proposed to be mobilization CPs (see for example <xref ref-type="bibr" rid="B5">Bachrach et al., 2004</xref>; <xref ref-type="bibr" rid="B8">Bjorland et al., 2007</xref>; <xref ref-type="bibr" rid="B42">Shkoporov et al., 2008</xref>). However, according to our analysis using CONJscan-T4SSscan, all these proteins belong to the TcpA family. Interestingly, none of these plasmids encode a canonical relaxase. Rather, they carry a &#x201C;RCR initiator&#x201D; gene (located next to the <italic>tcpA</italic>) encoding either one of the domains found in IME relaxases or a PF01446 domain (i.e., the domain found in RCR initiator/relaxases from the small plasmids mobilized by ICE<italic>Bs1</italic>). Therefore, it seems highly probable that these small plasmids are mobilizable. As previously proposed by <xref ref-type="bibr" rid="B29">Lee et al. (2012)</xref>, it is probable that at least some of the small plasmids from firmicutes encoding a &#x201C;RCR initiator&#x201D; and lacking any canonical relaxase gene, CP, or T4SS protein, could also be mobilizable. Finally, it should also be noted that many plasmids devoid of relaxase could also carry an <italic>oriT</italic> related to those of conjugative elements and therefore could be mobilizable <italic>in trans</italic>, as recently found for most plasmids from staphylococci (<xref ref-type="bibr" rid="B35">O&#x2019;Brien et al., 2015</xref>; <xref ref-type="bibr" rid="B37">Pollet et al., 2016</xref>). Taken together, all these data point to a previous underestimation of the number of mobilizable plasmids and instead support their very high prevalence.</p>
<p>Besides IMEs and ICEs, our analysis of streptococcal genomes reveals many elements that (i) are flanked by DRs and (ii) encode an integrase but (iii) are devoid of CP and of canonical or RCR initiator-related relaxase (data not shown). At least some of these could correspond to IMEs. This hypothesis is supported first by the discovery of a novel type of relaxase related to tyrosine recombinases that is encoded by the pCW3 conjugative plasmid from the firmicute <italic>C. perfringens</italic> (<xref ref-type="bibr" rid="B50">Wisniewski et al., 2016</xref>). Second, in proteobacteria, IMEs devoid of relaxase but carrying an <italic>oriT</italic> are found to be mobilizable (<xref ref-type="bibr" rid="B14">Daccord et al., 2010</xref>) and one such IME (IME MTn<italic>Sag1</italic>) has previously been described in <italic>S. agalactiae</italic> (<xref ref-type="bibr" rid="B1">Achard and Leclercq, 2007</xref>). Thus, the prevalence and diversity of IMEs within analyzed streptococcal genomes could be even greater than that described here.</p>
</sec>
<sec><title>Modular and Intramodular Evolution</title>
<p>The comparison of phylogenetic analyses of integrases with those of relaxases and CPs reveals many inconsistencies, probably due to multiple replacements of integration/excision or mobilization modules between IMEs. Such replacements were previously observed in streptococcal ICEs (<xref ref-type="bibr" rid="B3">Ambroset et al., 2016</xref>). The phylogenetic analysis of integrase families (<bold>Figure <xref ref-type="fig" rid="F1">1</xref></bold> and <bold>Supplementary Figure <xref ref-type="supplementary-material" rid="SM1">S1</xref></bold>) clearly shows that replacement of integration/excision modules can occur not only between IMEs or between ICEs but also between ICEs and IMEs.</p>
<p>Within the mobilization modules encoding non-canonical relaxases, the comparison of phylogenetic analyses and/or co-occurrence of relaxases and TcpA CPs reveals inconsistencies. Thus, 10 out of 25 IMEs encoding a MobT relaxase that belongs to the PF02486_6 family do not carry a <italic>tcpA</italic> gene or pseudogene, whereas the 15 others have one. The distribution of these latter suggests that an ancestral IME devoid of TcpA has recently acquired a <italic>tcpA</italic> gene. On the contrary, among IMEs encoding relaxases belonging to the PF01719, PF01719-PF00910, and PHA00330 superfamilies, only 13 do not encode a TcpA and probably lost their <italic>tcpA</italic> by deletion. In some cases, almost identical IME relaxases (see for example the Rel_PF02486_6 cluster in <bold>Supplementary Figure <xref ref-type="supplementary-material" rid="SM2">S2</xref></bold>) are associated with TcpA from different families suggesting that intramodular gene replacements occurred. In most cases, the data does not allow us to determine precisely what happened. However, the phylogenetic tree of the PF02486_6 relaxases suggests a replacement of a TcpA_5 CP by a TcpA_6 CP. Interestingly, although two superfamilies of relaxase (Rel_PF02486/MobT and Rel_PF03432/MobP) and the two superfamilies of CPs (VirD4 and TcpA) are shared by ICEs and IMEs from streptococci, there is no evidence of exchange of these genes between ICEs and IMEs.</p>
<p>Various IMEs integrated in <italic>rpsI</italic>, <italic>rpmG</italic>, and <italic>rplL</italic> were found to be integrated in tandem with other IMEs or ICEs encoding either related, distantly related, or unrelated integrases, relaxases, and/or CPs. We have also found many decayed elements or genomic islands in accretion with streptococcal IMEs (data not shown). These accretions result from the integration of an incoming IME or ICE by site-specific recombination in the <italic>attL</italic> or <italic>attR</italic> site of a related or unrelated resident element that may not be followed by a deletion (<xref ref-type="bibr" rid="B36">Pavlovic et al., 2004</xref>; <xref ref-type="bibr" rid="B6">Bellanger et al., 2011</xref>). An accretion between elements targeting the same insertion gene and subsequent deletion of one of the transfer modules and one of the recombination modules is probably responsible for a large part of the replacement of modules or TcpA genes.</p>
</sec>
<sec><title>Are TcpA CPs Needed or Not for Mobilization?</title>
<p>In fact, the non-canonical TcpA superfamily of CPs was previously reported to be encoded by conjugation modules from firmicutes, but TcpA has not yet been found in a mobilization module. In conjugative elements, TcpA proteins are associated with non-canonical relaxases: (i) the relaxase of the conjugative pCW3 plasmid from <italic>C. perfringens</italic> that is related to tyrosine recombinases (<xref ref-type="bibr" rid="B50">Wisniewski et al., 2016</xref>) or (ii) the MobT relaxases from the ICEs belonging to ICE<italic>Bs1</italic>/Tn<italic>916</italic>/ICE<italic>St3</italic> superfamily that are related to RCR initiators. In this work, we identified many IMEs encoding a TcpA CP: all of them encode a non-canonical relaxase. Although all IMEs encoding a non-canonical relaxase have a similar organization, their mobilization modules are highly versatile. First, closely related relaxases can be associated or not with a TcpA CP, suggesting that IME-encoded CP might not be needed for mobilization. If so, it can be hypothesized that the non-canonical relaxase might interact with the T4SS of the mobilizing conjugative element, either <italic>via</italic> the CP encoded by the conjugative element or <italic>via</italic> its cognate CP. In this hypothesis, the IME-encoded TcpA might enhance the mobilization efficiency and/or enlarge the mobilization range. Second, closely related relaxases can be associated with different distantly related TcpA CPs, indicating that the IME relaxase can interact with distantly related CPs. We hypothesize that the change of CP might have an impact on the mobilization efficiency and/or range.</p>
</sec>
<sec><title>IMEs within ICEs, a New Mobilization Mechanism?</title>
<p>The IMEs from streptococci carry diverse recombination modules and have a large array of integration specificity. Almost all serine integrases from IMEs catalyze site-specific integration within genes leading to their disruption. Interestingly, the majority of IME serine integrases (12/16) specifically target several conserved genes from the Tn<italic>5252</italic> superfamily, a group of ICEs that is widespread in streptococci. As previously discussed for ICEs (<xref ref-type="bibr" rid="B3">Ambroset et al., 2016</xref>), we would expect that target specificity should be selected to have the least effect on host fitness. Here, the disruption of a conjugation gene would have little or no effect on bacterial host but would be deleterious or lethal for the host ICE. For instance, insertion in <italic>traG</italic>, that encodes a VirD4 CP, would abolish the ICE transfer and therefore the mobilization of the IME by the host ICE. The consequences of the integration/excision balance of ICE or IME encoding serine recombinases have never been studied but are documented for some prophages encoding serine recombinase. For these prophages, excision occurs not only during the activation of lytic phase but also when expression of the host target gene is needed (<xref ref-type="bibr" rid="B27">Kunkel et al., 1990</xref>; <xref ref-type="bibr" rid="B39">Rabinovich et al., 2012</xref>). By analogy, we can hypothesize that excision of IMEs integrated within specific conjugation genes of ICEs would be caused by the induction of conjugation. After IME excision, the conjugation module would be functional and could be expressed, thus allowing ICE transfer. The IME could use the CP and T4SS of this ICE to transfer and then could integrate in the ICE in the transconjugant. 
Furthermore, if the ICE that primarily hosts the IME does not transfer or integrate in the recipient cell, the incoming IME could integrate in another resident element (related ICE or decayed ICE as long as it carries the IME integration site). This would explain the presence of such IMEs in many decayed ICEs from streptococci. ICE<italic>Sp2905</italic> from <italic>S. pyogenes</italic>, an ICE integrated in <italic>rumA</italic>, was demonstrated to transfer (<xref ref-type="bibr" rid="B19">Giovanetti et al., 2012</xref>) although it carries two IMEs: one integrated in <italic>snf2</italic> and the other in <italic>maff2</italic> (<xref ref-type="bibr" rid="B7">Bellanger et al., 2014</xref>). Although we cannot exclude that the disrupted genes are not required for ICE transfer, we can also hypothesize that the transfer could be divided into successive stages including excisions of the ICE and IMEs, independent transfers of the IMEs and of the ICE devoid of IMEs, insertions of the transferred ICE in <italic>rumA</italic> site and insertion of the IMEs within the transferred ICE. Such a mobilization mechanism of an IME integrated in an ICE can also be proposed for IMEs encoding tyrosine integrases that are site-specifically integrated in the putative <italic>oriT</italic> from ICEs belonging to Tn<italic>916</italic> and ICE<italic>St3</italic> families that were found in <italic>S. agalactiae</italic> and in <italic>S. mutans</italic> (<xref ref-type="bibr" rid="B38">Puymege et al., 2015</xref>).</p>
</sec>
<sec><title>Replication of Excised IMEs</title>
<p>Integrative and mobilizable elements and ICEs are integrated in the chromosome and are transmitted to the daughter cell as part of the chromosome. However, an excised IME would be lost in one of the daughter cells during cell division in the absence of replication. Several recent studies indicated that extrachromosomal replication is involved in the maintenance of various ICEs transferring as single-strand DNA (<xref ref-type="bibr" rid="B40">Ramsay et al., 2006</xref>; <xref ref-type="bibr" rid="B29">Lee et al., 2012</xref>; <xref ref-type="bibr" rid="B21">Guerillot et al., 2013</xref>; <xref ref-type="bibr" rid="B12">Carraro et al., 2015</xref>), but data suggesting replication of excised IMEs have not been reported so far. All streptococcal IMEs encoding a Rel_PF03432/MobP relaxase and most of those encoding a Rel_PF03389/MobQ carry one or two genes encoding proteins downstream from the relaxase gene that are distantly related to primosome proteins. Such proteins are known to be responsible for the initiation of the theta replication of prophages. Altogether, these data suggest that these IMEs are able to replicate with a theta mechanism after excision. Ten other IMEs (IME_Class_10 family) sharing a similar organization encode two putative relaxases. One belongs to Rel_PF02486/MobT superfamily, i.e., a family including both RCR initiators and relaxases. The other belongs to Rel_PF01076/MobV family. The structure of the region carrying these genes is reminiscent of that of numerous mobilizable plasmids from firmicutes where the Rel_PF01076/MobV protein was found to be involved in mobilization whereas the Rel_PF02486/MobT protein is involved in RCR (<xref ref-type="bibr" rid="B31">Lorenzo-Diaz et al., 2014</xref>). Accordingly, the Rel_PF01076/MobV protein of an IME of the IME_Class_10 family was very recently shown to be a mobilization relaxase (<xref ref-type="bibr" rid="B30">Lorenzo-Diaz et al., 2016</xref>). 
Therefore, it is likely that the Rel_PF01076/MobV protein is the IME relaxase, whereas the Rel_PF02486/MobT protein would be involved in RCR replication of the excised IME. Alternatively, as previously found for the MobT relaxase of ICE<italic>Bs1</italic> (<xref ref-type="bibr" rid="B29">Lee et al., 2012</xref>), the Rel_PF02486/MobT protein could ensure both functions. Finally, all IMEs encoding a single Rel_PF01076/MobV relaxase encode a protein related to the ParB proteins that could be involved in the partition of the excised IME. Taken together, these data suggest that almost all streptococcal IMEs encoding canonical relaxases (except the two elements encoding a MobC relaxase) encode proteins involved in the maintenance of their excised forms. Such proteins were not found for any IME encoding single non-canonical relaxases such as MobT. Since the MobT protein from ICE<italic>Bs1</italic> is both the relaxase and the initiator of RCR involved in the maintenance of excised ICE<italic>Bs1</italic> (<xref ref-type="bibr" rid="B29">Lee et al., 2012</xref>), we cannot exclude the possibility that the five superfamilies of non-canonical relaxases might have both functions. Overall, many if not all IMEs and ICEs might exist in two states, namely a main dormant integrated state and an activated excised state which would be maintained by replication.</p>
</sec>
</sec>
<sec><title>Author Contributions</title>
<p>GG and SP conceived the reference database of signature proteins. CC, NL-B, GG, and M-DD contributed to the conception of the work. CC, GG, NL-B, CA, M-DD, VL, and TL performed the acquisition and analysis of the data. GG, NL-B, CC, and M-DD drafted the manuscript. CC, NL-B, GG, and SP elaborated the figures, tables, and references. All authors criticized and finally approved the final version of the manuscript.</p>
</sec>
<sec><title>Conflict of Interest Statement</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
</body>
<back>
<fn-group>
<fn fn-type="financial-disclosure">
<p><bold>Funding.</bold> This work was supported by the R&#x00E9;gion Lorraine and the Universit&#x00E9; de Lorraine.</p></fn>
</fn-group>
<ack>
<p>CC is the recipient of a scholarship from the Minist&#x00E8;re de l&#x2019;Enseignement Sup&#x00E9;rieur et de la Recherche.</p>
</ack>
<sec sec-type="supplementary material">
<title>Supplementary Material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="http://journal.frontiersin.org/article/10.3389/fmicb.2017.00443/full#supplementary-material">http://journal.frontiersin.org/article/10.3389/fmicb.2017.00443/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Image_1.TIF" id="SM1" mimetype="image/tif" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>FIGURE S1</label>
<caption><p><bold>Phylogenetic tree of serine integrases.</bold> One representative of each 90% protein identity cluster from IMEs (in black) and one representative of each 90% protein identity cluster of serine integrases from ICEs targeting the same site as IMEs (in mauve and underlined) are presented in the ML tree. Bootstrap values (BioNJ/ML) are given only when they exceed 50 for both analyses. The target gene is mentioned in the IME/ICE names. Serine integrases sharing more than 40% identity and therefore belonging to the same family are merged with brackets. These families are distinguished with different numbers. Refer to Supplementary Table <xref ref-type="supplementary-material" rid="SM7">S1</xref> for IME and strain details.</p></caption>
</supplementary-material>
<supplementary-material xlink:href="Image_1.TIF" id="S1" mimetype="image/tif" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image_2.TIF" id="SM2" mimetype="image/tif" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>FIGURE S2</label>
<caption><p><bold>Phylogenetic tree of Rel_PF02486/MobT relaxases.</bold> All the Rel_PF02486/MobT relaxases from IMEs (in black) and only one representative of each 90% protein identity cluster of MobT relaxases from ICEs (in mauve and underlined) are presented in the ML tree. Bootstrap values (BioNJ/ML) are given only when they exceed 50 for both analyses. Relaxases sharing more than 40% sequence identity and therefore belonging to the same family are merged with brackets. These families are distinguished with a number preceded by the Pfam identifier of the characteristic domain of this superfamily. The TcpA family associated with each relaxase is indicated.</p></caption>
</supplementary-material>
<supplementary-material xlink:href="Image_2.TIF" id="S2" mimetype="image/tif" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image_3.TIF" id="SM3" mimetype="image/tif" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>FIGURE S3</label>
<caption><p><bold>Phylogenetic tree of Rel_PF01719 relaxases.</bold> All the Rel_PF01719 relaxases are presented in the ML tree. Bootstrap values (BioNJ/ML) are given only when they exceed 50 for both analyses. All these relaxases share more than 40% sequence identity and therefore belong to a unique family. The TcpA family associated with each relaxase is indicated.</p></caption>
</supplementary-material>
<supplementary-material xlink:href="Image_3.TIF" id="S3" mimetype="image/tif" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image_4.TIF" id="SM4" mimetype="image/tif" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>FIGURE S4</label>
<caption><p><bold>Phylogenetic tree of Rel_PHA00330 relaxases.</bold> All the Rel_PHA00330 relaxases are presented in the ML tree. Bootstrap values (BioNJ/ML) are given only when they exceed 50 for both analyses. The relaxases sharing more than 40% sequence identity and therefore belonging to the same family are merged with brackets. These families are distinguished with a number preceded by the identifier of the characteristic domain of this superfamily. The TcpA family associated with each relaxase is indicated.</p></caption>
</supplementary-material>
<supplementary-material xlink:href="Image_4.TIF" id="S4" mimetype="image/tif" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image_5.TIF" id="SM5" mimetype="image/tif" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>FIGURE S5</label>
<caption><p><bold>Phylogenetic tree of Rel_PF01719-PF00910 relaxases.</bold> All the Rel_PF01719-PF00910 relaxases are presented in the ML tree. Bootstrap values (BioNJ/ML) are given only when they exceed 50 for both analyses. The relaxases sharing more than 40% sequence identity and therefore belonging to the same family are merged with brackets. These families are distinguished with a number preceded by the Pfam identifier of the characteristic domains of this superfamily. The TcpA family associated with each relaxase is indicated.</p></caption>
</supplementary-material>
<supplementary-material xlink:href="Image_5.TIF" id="S5" mimetype="image/tif" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image_6.TIF" id="SM6" mimetype="image/tif" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>FIGURE S6</label>
<caption><p><bold>Phylogenetic tree of TcpA proteins.</bold> All the TcpA CPs from IMEs (in black) and one of each 90% protein identity cluster of TcpA from ICEs (in mauve and underlined) are presented in the BioNJ tree. Bootstrap values are given only when they exceed 50. The TcpA CPs sharing more than 40% sequence identity and therefore belonging to the same family are merged with brackets. These families are distinguished with different numbers. The relaxase families associated with each TcpA family are indicated.</p></caption>
</supplementary-material>
<supplementary-material xlink:href="Image_6.TIF" id="S6" mimetype="image/tif" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table_1.XLSX" id="SM7" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Achard</surname> <given-names>A.</given-names></name> <name><surname>Leclercq</surname> <given-names>R.</given-names></name></person-group> (<year>2007</year>). <article-title>Characterization of a small mobilizable transposon, MTnSag1, in <italic>Streptococcus agalactiae</italic>.</article-title> <source><italic>J. Bacteriol.</italic></source> <volume>189</volume> <fpage>4328</fpage>&#x2013;<lpage>4331</lpage>. <pub-id pub-id-type="doi">10.1128/JB.00213-07</pub-id></citation></ref>
<ref id="B2"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Alva</surname> <given-names>V.</given-names></name> <name><surname>Nam</surname> <given-names>S. Z.</given-names></name> <name><surname>Soding</surname> <given-names>J.</given-names></name> <name><surname>Lupas</surname> <given-names>A. N.</given-names></name></person-group> (<year>2016</year>). <article-title>The MPI bioinformatics Toolkit as an integrative platform for advanced protein sequence and structure analysis.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>44</volume> <fpage>W410</fpage>&#x2013;<lpage>W415</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkw348</pub-id></citation></ref>
<ref id="B3"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ambroset</surname> <given-names>C.</given-names></name> <name><surname>Coluzzi</surname> <given-names>C.</given-names></name> <name><surname>Guedon</surname> <given-names>G.</given-names></name> <name><surname>Devignes</surname> <given-names>M. D.</given-names></name> <name><surname>Loux</surname> <given-names>V.</given-names></name> <name><surname>Lacroix</surname> <given-names>T.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>New insights into the classification and integration specificity of <italic>Streptococcus</italic> integrative conjugative elements through extensive genome exploration.</article-title> <source><italic>Front. Microbiol.</italic></source> <volume>6</volume>:<issue>1483</issue>. <pub-id pub-id-type="doi">10.3389/fmicb.2015.01483</pub-id></citation></ref>
<ref id="B4"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Auchtung</surname> <given-names>J. M.</given-names></name> <name><surname>Aleksanyan</surname> <given-names>N.</given-names></name> <name><surname>Bulku</surname> <given-names>A.</given-names></name> <name><surname>Berkmen</surname> <given-names>M. B.</given-names></name></person-group> (<year>2016</year>). <article-title>Biology of ICEBs1, an integrative and conjugative element in <italic>Bacillus subtilis</italic>.</article-title> <source><italic>Plasmid</italic></source> <volume>86</volume> <fpage>14</fpage>&#x2013;<lpage>25</lpage>. <pub-id pub-id-type="doi">10.1016/j.plasmid.2016.07.001</pub-id></citation></ref>
<ref id="B5"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bachrach</surname> <given-names>G.</given-names></name> <name><surname>Haake</surname> <given-names>S. K.</given-names></name> <name><surname>Glick</surname> <given-names>A.</given-names></name> <name><surname>Hazan</surname> <given-names>R.</given-names></name> <name><surname>Naor</surname> <given-names>R.</given-names></name> <name><surname>Andersen</surname> <given-names>R. N.</given-names></name><etal/></person-group> (<year>2004</year>). <article-title>Characterization of the novel <italic>Fusobacterium nucleatum</italic> plasmid pKH9 and evidence of an addiction system.</article-title> <source><italic>Appl. Environ. Microbiol.</italic></source> <volume>70</volume> <fpage>6957</fpage>&#x2013;<lpage>6962</lpage>. <pub-id pub-id-type="doi">10.1128/AEM.70.12.6957-6962.2004</pub-id></citation></ref>
<ref id="B6"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bellanger</surname> <given-names>X.</given-names></name> <name><surname>Morel</surname> <given-names>C.</given-names></name> <name><surname>Gonot</surname> <given-names>F.</given-names></name> <name><surname>Puymege</surname> <given-names>A.</given-names></name> <name><surname>Decaris</surname> <given-names>B.</given-names></name> <name><surname>Guedon</surname> <given-names>G.</given-names></name></person-group> (<year>2011</year>). <article-title>Site-specific accretion of an integrative conjugative element together with a related genomic island leads to cis mobilization and gene capture.</article-title> <source><italic>Mol. Microbiol.</italic></source> <volume>81</volume> <fpage>912</fpage>&#x2013;<lpage>925</lpage>. <pub-id pub-id-type="doi">10.1111/j.1365-2958.2011.07737.x</pub-id></citation></ref>
<ref id="B7"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bellanger</surname> <given-names>X.</given-names></name> <name><surname>Payot</surname> <given-names>S.</given-names></name> <name><surname>Leblond-Bourget</surname> <given-names>N.</given-names></name> <name><surname>Guedon</surname> <given-names>G.</given-names></name></person-group> (<year>2014</year>). <article-title>Conjugative and mobilizable genomic islands in bacteria: evolution and diversity.</article-title> <source><italic>FEMS Microbiol. Rev.</italic></source> <volume>38</volume> <fpage>720</fpage>&#x2013;<lpage>760</lpage>. <pub-id pub-id-type="doi">10.1111/1574-6976.12058</pub-id></citation></ref>
<ref id="B8"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bjorland</surname> <given-names>J.</given-names></name> <name><surname>Bratlie</surname> <given-names>M. S.</given-names></name> <name><surname>Steinum</surname> <given-names>T.</given-names></name></person-group> (<year>2007</year>). <article-title>The smr gene resides on a novel plasmid pSP187 identified in a <italic>Staphylococcus pasteuri</italic> isolate recovered from unpasteurized milk.</article-title> <source><italic>Plasmid</italic></source> <volume>57</volume> <fpage>145</fpage>&#x2013;<lpage>155</lpage>. <pub-id pub-id-type="doi">10.1016/j.plasmid.2006.08.004</pub-id></citation></ref>
<ref id="B9"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Brochet</surname> <given-names>M.</given-names></name> <name><surname>Couve</surname> <given-names>E.</given-names></name> <name><surname>Glaser</surname> <given-names>P.</given-names></name> <name><surname>Guedon</surname> <given-names>G.</given-names></name> <name><surname>Payot</surname> <given-names>S.</given-names></name></person-group> (<year>2008</year>). <article-title>Integrative conjugative elements and related elements are major contributors to the genome diversity of <italic>Streptococcus agalactiae</italic>.</article-title> <source><italic>J. Bacteriol.</italic></source> <volume>190</volume> <fpage>6913</fpage>&#x2013;<lpage>6917</lpage>. <pub-id pub-id-type="doi">10.1128/JB.00824-08</pub-id></citation></ref>
<ref id="B10"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Burrus</surname> <given-names>V.</given-names></name> <name><surname>Pavlovic</surname> <given-names>G.</given-names></name> <name><surname>Decaris</surname> <given-names>B.</given-names></name> <name><surname>Guedon</surname> <given-names>G.</given-names></name></person-group> (<year>2002</year>). <article-title>Conjugative transposons: the tip of the iceberg.</article-title> <source><italic>Mol. Microbiol.</italic></source> <volume>46</volume> <fpage>601</fpage>&#x2013;<lpage>610</lpage>.</citation></ref>
<ref id="B11"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cabezon</surname> <given-names>E.</given-names></name> <name><surname>Ripoll-Rozada</surname> <given-names>J.</given-names></name> <name><surname>Pena</surname> <given-names>A.</given-names></name> <name><surname>De La Cruz</surname> <given-names>F.</given-names></name> <name><surname>Arechaga</surname> <given-names>I.</given-names></name></person-group> (<year>2015</year>). <article-title>Towards an integrated model of bacterial conjugation.</article-title> <source><italic>FEMS Microbiol. Rev.</italic></source> <volume>39</volume> <fpage>81</fpage>&#x2013;<lpage>95</lpage>. <pub-id pub-id-type="doi">10.1111/1574-6976.12085</pub-id></citation></ref>
<ref id="B12"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Carraro</surname> <given-names>N.</given-names></name> <name><surname>Poulin</surname> <given-names>D.</given-names></name> <name><surname>Burrus</surname> <given-names>V.</given-names></name></person-group> (<year>2015</year>). <article-title>Replication and active partition of integrative and conjugative elements (ICEs) of the SXT/R391 family: the line between ICEs and conjugative plasmids is getting thinner.</article-title> <source><italic>PLoS Genet.</italic></source> <volume>11</volume>:<issue>e1005298</issue>. <pub-id pub-id-type="doi">10.1371/journal.pgen.1005298</pub-id></citation></ref>
<ref id="B13"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chandran Darbari</surname> <given-names>V.</given-names></name> <name><surname>Waksman</surname> <given-names>G.</given-names></name></person-group> (<year>2015</year>). <article-title>Structural biology of bacterial type IV secretion systems.</article-title> <source><italic>Annu. Rev. Biochem.</italic></source> <volume>84</volume> <fpage>603</fpage>&#x2013;<lpage>629</lpage>. <pub-id pub-id-type="doi">10.1146/annurev-biochem-062911-102821</pub-id></citation></ref>
<ref id="B14"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Daccord</surname> <given-names>A.</given-names></name> <name><surname>Ceccarelli</surname> <given-names>D.</given-names></name> <name><surname>Burrus</surname> <given-names>V.</given-names></name></person-group> (<year>2010</year>). <article-title>Integrating conjugative elements of the SXT/R391 family trigger the excision and drive the mobilization of a new class of <italic>Vibrio</italic> genomic islands.</article-title> <source><italic>Mol. Microbiol.</italic></source> <volume>78</volume> <fpage>576</fpage>&#x2013;<lpage>588</lpage>. <pub-id pub-id-type="doi">10.1111/j.1365-2958.2010.07364.x</pub-id></citation></ref>
<ref id="B15"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ebisu</surname> <given-names>S.</given-names></name> <name><surname>Murahashi</surname> <given-names>Y.</given-names></name> <name><surname>Takagi</surname> <given-names>H.</given-names></name> <name><surname>Kadowaki</surname> <given-names>K.</given-names></name> <name><surname>Yamaguchi</surname> <given-names>K.</given-names></name> <name><surname>Yamagata</surname> <given-names>H.</given-names></name><etal/></person-group> (<year>1995</year>). <article-title>Nucleotide sequence and replication properties of the <italic>Bacillus borstelensis</italic> cryptic plasmid pHT926.</article-title> <source><italic>Appl. Environ. Microbiol.</italic></source> <volume>61</volume> <fpage>3154</fpage>&#x2013;<lpage>3157</lpage>.</citation></ref>
<ref id="B16"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Francia</surname> <given-names>M. V.</given-names></name> <name><surname>Varsaki</surname> <given-names>A.</given-names></name> <name><surname>Garcillan-Barcia</surname> <given-names>M. P.</given-names></name> <name><surname>Latorre</surname> <given-names>A.</given-names></name> <name><surname>Drainas</surname> <given-names>C.</given-names></name> <name><surname>De La Cruz</surname> <given-names>F.</given-names></name></person-group> (<year>2004</year>). <article-title>A classification scheme for mobilization regions of bacterial plasmids.</article-title> <source><italic>FEMS Microbiol. Rev.</italic></source> <volume>28</volume> <fpage>79</fpage>&#x2013;<lpage>100</lpage>. <pub-id pub-id-type="doi">10.1016/j.femsre.2003.09.001</pub-id></citation></ref>
<ref id="B17"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Garcillan-Barcia</surname> <given-names>M. P.</given-names></name> <name><surname>Francia</surname> <given-names>M. V.</given-names></name> <name><surname>De La Cruz</surname> <given-names>F.</given-names></name></person-group> (<year>2009</year>). <article-title>The diversity of conjugative relaxases and its application in plasmid classification.</article-title> <source><italic>FEMS Microbiol. Rev.</italic></source> <volume>33</volume> <fpage>657</fpage>&#x2013;<lpage>687</lpage>.</citation></ref>
<ref id="B18"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gibbs</surname> <given-names>M. J.</given-names></name> <name><surname>Smeianov</surname> <given-names>V. V.</given-names></name> <name><surname>Steele</surname> <given-names>J. L.</given-names></name> <name><surname>Upcroft</surname> <given-names>P.</given-names></name> <name><surname>Efimov</surname> <given-names>B. A.</given-names></name></person-group> (<year>2006</year>). <article-title>Two families of rep-like genes that probably originated by interspecies recombination are represented in viral, plasmid, bacterial, and parasitic protozoan genomes.</article-title> <source><italic>Mol. Biol. Evol.</italic></source> <volume>23</volume> <fpage>1097</fpage>&#x2013;<lpage>1100</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/msj122</pub-id></citation></ref>
<ref id="B19"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Giovanetti</surname> <given-names>E.</given-names></name> <name><surname>Brenciani</surname> <given-names>A.</given-names></name> <name><surname>Tiberi</surname> <given-names>E.</given-names></name> <name><surname>Bacciaglia</surname> <given-names>A.</given-names></name> <name><surname>Varaldo</surname> <given-names>P. E.</given-names></name></person-group> (<year>2012</year>). <article-title>ICESp2905, the erm(TR)-tet(O) element of <italic>Streptococcus pyogenes</italic>, is formed by two independent integrative and conjugative elements.</article-title> <source><italic>Antimicrob. Agents Chemother.</italic></source> <volume>56</volume> <fpage>591</fpage>&#x2013;<lpage>594</lpage>. <pub-id pub-id-type="doi">10.1128/AAC.05352-11</pub-id></citation></ref>
<ref id="B20"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gouy</surname> <given-names>M.</given-names></name> <name><surname>Guindon</surname> <given-names>S.</given-names></name> <name><surname>Gascuel</surname> <given-names>O.</given-names></name></person-group> (<year>2010</year>). <article-title>SeaView version 4: a multiplatform graphical user interface for sequence alignment and phylogenetic tree building.</article-title> <source><italic>Mol. Biol. Evol.</italic></source> <volume>27</volume> <fpage>221</fpage>&#x2013;<lpage>224</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/msp259</pub-id></citation></ref>
<ref id="B21"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Guerillot</surname> <given-names>R.</given-names></name> <name><surname>Da Cunha</surname> <given-names>V.</given-names></name> <name><surname>Sauvage</surname> <given-names>E.</given-names></name> <name><surname>Bouchier</surname> <given-names>C.</given-names></name> <name><surname>Glaser</surname> <given-names>P.</given-names></name></person-group> (<year>2013</year>). <article-title>Modular evolution of TnGBSs, a new family of integrative and conjugative elements associating insertion sequence transposition, plasmid replication, and conjugation for their spreading.</article-title> <source><italic>J. Bacteriol.</italic></source> <volume>195</volume> <fpage>1979</fpage>&#x2013;<lpage>1990</lpage>. <pub-id pub-id-type="doi">10.1128/JB.01745-12</pub-id></citation></ref>
<ref id="B22"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Guglielmini</surname> <given-names>J.</given-names></name> <name><surname>De La Cruz</surname> <given-names>F.</given-names></name> <name><surname>Rocha</surname> <given-names>E. P.</given-names></name></person-group> (<year>2013</year>). <article-title>Evolution of conjugation and type IV secretion systems.</article-title> <source><italic>Mol. Biol. Evol.</italic></source> <volume>30</volume> <fpage>315</fpage>&#x2013;<lpage>331</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/mss221</pub-id></citation></ref>
<ref id="B23"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Guglielmini</surname> <given-names>J.</given-names></name> <name><surname>Neron</surname> <given-names>B.</given-names></name> <name><surname>Abby</surname> <given-names>S. S.</given-names></name> <name><surname>Garcillan-Barcia</surname> <given-names>M. P.</given-names></name> <name><surname>De La Cruz</surname> <given-names>F.</given-names></name> <name><surname>Rocha</surname> <given-names>E. P.</given-names></name></person-group> (<year>2014</year>). <article-title>Key components of the eight classes of type IV secretion systems involved in bacterial conjugation or protein secretion.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>42</volume> <fpage>5715</fpage>&#x2013;<lpage>5727</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gku194</pub-id></citation></ref>
<ref id="B24"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Guglielmini</surname> <given-names>J.</given-names></name> <name><surname>Quintais</surname> <given-names>L.</given-names></name> <name><surname>Garcillan-Barcia</surname> <given-names>M. P.</given-names></name> <name><surname>De La Cruz</surname> <given-names>F.</given-names></name> <name><surname>Rocha</surname> <given-names>E. P.</given-names></name></person-group> (<year>2011</year>). <article-title>The repertoire of ICE in prokaryotes underscores the unity, diversity, and ubiquity of conjugation.</article-title> <source><italic>PLoS Genet.</italic></source> <volume>7</volume>:<issue>e1002222</issue>. <pub-id pub-id-type="doi">10.1371/journal.pgen.1002222</pub-id></citation></ref>
<ref id="B25"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ilangovan</surname> <given-names>A.</given-names></name> <name><surname>Connery</surname> <given-names>S.</given-names></name> <name><surname>Waksman</surname> <given-names>G.</given-names></name></person-group> (<year>2015</year>). <article-title>Structural biology of the gram-negative bacterial conjugation systems.</article-title> <source><italic>Trends Microbiol.</italic></source> <volume>23</volume> <fpage>301</fpage>&#x2013;<lpage>310</lpage>. <pub-id pub-id-type="doi">10.1016/j.tim.2015.02.012</pub-id></citation></ref>
<ref id="B26"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Krzywinski</surname> <given-names>M.</given-names></name> <name><surname>Schein</surname> <given-names>J.</given-names></name> <name><surname>Birol</surname> <given-names>I.</given-names></name> <name><surname>Connors</surname> <given-names>J.</given-names></name> <name><surname>Gascoyne</surname> <given-names>R.</given-names></name> <name><surname>Horsman</surname> <given-names>D.</given-names></name><etal/></person-group> (<year>2009</year>). <article-title>Circos: an information aesthetic for comparative genomics.</article-title> <source><italic>Genome Res.</italic></source> <volume>19</volume> <fpage>1639</fpage>&#x2013;<lpage>1645</lpage>. <pub-id pub-id-type="doi">10.1101/gr.092759.109</pub-id></citation></ref>
<ref id="B27"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kunkel</surname> <given-names>B.</given-names></name> <name><surname>Losick</surname> <given-names>R.</given-names></name> <name><surname>Stragier</surname> <given-names>P.</given-names></name></person-group> (<year>1990</year>). <article-title>The <italic>Bacillus subtilis</italic> gene for the development transcription factor sigma K is generated by excision of a dispensable DNA element containing a sporulation recombinase gene.</article-title> <source><italic>Genes Dev.</italic></source> <volume>4</volume> <fpage>525</fpage>&#x2013;<lpage>535</lpage>.</citation></ref>
<ref id="B28"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lee</surname> <given-names>C. A.</given-names></name> <name><surname>Babic</surname> <given-names>A.</given-names></name> <name><surname>Grossman</surname> <given-names>A. D.</given-names></name></person-group> (<year>2010</year>). <article-title>Autonomous plasmid-like replication of a conjugative transposon.</article-title> <source><italic>Mol. Microbiol.</italic></source> <volume>75</volume> <fpage>268</fpage>&#x2013;<lpage>279</lpage>. <pub-id pub-id-type="doi">10.1111/j.1365-2958.2009.06985.x</pub-id></citation></ref>
<ref id="B29"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lee</surname> <given-names>C. A.</given-names></name> <name><surname>Thomas</surname> <given-names>J.</given-names></name> <name><surname>Grossman</surname> <given-names>A. D.</given-names></name></person-group> (<year>2012</year>). <article-title>The <italic>Bacillus subtilis</italic> conjugative transposon ICEBs1 mobilizes plasmids lacking dedicated mobilization functions.</article-title> <source><italic>J. Bacteriol.</italic></source> <volume>194</volume> <fpage>3165</fpage>&#x2013;<lpage>3172</lpage>. <pub-id pub-id-type="doi">10.1128/JB.00301-12</pub-id></citation></ref>
<ref id="B30"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lorenzo-Diaz</surname> <given-names>F.</given-names></name> <name><surname>Fernandez-Lopez</surname> <given-names>C.</given-names></name> <name><surname>Douarre</surname> <given-names>P. E.</given-names></name> <name><surname>Baez-Ortega</surname> <given-names>A.</given-names></name> <name><surname>Flores</surname> <given-names>C.</given-names></name> <name><surname>Glaser</surname> <given-names>P.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>Streptococcal group B integrative and mobilizable element IMESag-rpsI encodes a functional relaxase involved in its transfer.</article-title> <source><italic>Open Biol.</italic></source> <volume>6</volume>:<issue>160084</issue>. <pub-id pub-id-type="doi">10.1098/rsob.160084</pub-id></citation></ref>
<ref id="B31"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lorenzo-Diaz</surname> <given-names>F.</given-names></name> <name><surname>Fernandez-Lopez</surname> <given-names>C.</given-names></name> <name><surname>Garcillan-Barcia</surname> <given-names>M. P.</given-names></name> <name><surname>Espinosa</surname> <given-names>M.</given-names></name></person-group> (<year>2014</year>). <article-title>Bringing them together: plasmid pMV158 rolling circle replication and conjugation under an evolutionary perspective.</article-title> <source><italic>Plasmid</italic></source> <volume>74</volume> <fpage>15</fpage>&#x2013;<lpage>31</lpage>. <pub-id pub-id-type="doi">10.1016/j.plasmid.2014.05.004</pub-id></citation></ref>
<ref id="B32"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>McDonnell</surname> <given-names>B.</given-names></name> <name><surname>Mahony</surname> <given-names>J.</given-names></name> <name><surname>Neve</surname> <given-names>H.</given-names></name> <name><surname>Hanemaaijer</surname> <given-names>L.</given-names></name> <name><surname>Noben</surname> <given-names>J. P.</given-names></name> <name><surname>Kouwen</surname> <given-names>T.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>Identification and analysis of a novel group of bacteriophages infecting the lactic acid bacterium <italic>Streptococcus thermophilus</italic>.</article-title> <source><italic>Appl. Environ. Microbiol.</italic></source> <volume>82</volume> <fpage>5153</fpage>&#x2013;<lpage>5165</lpage>. <pub-id pub-id-type="doi">10.1128/AEM.00835-16</pub-id></citation></ref>
<ref id="B33"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Meyer</surname> <given-names>R.</given-names></name></person-group> (<year>2009</year>). <article-title>Replication and conjugative mobilization of broad host-range IncQ plasmids.</article-title> <source><italic>Plasmid</italic></source> <volume>62</volume> <fpage>57</fpage>&#x2013;<lpage>70</lpage>. <pub-id pub-id-type="doi">10.1016/j.plasmid.2009.05.001</pub-id></citation></ref>
<ref id="B34"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Naglich</surname> <given-names>J. G.</given-names></name> <name><surname>Andrews</surname> <given-names>R. E.</given-names> <suffix>Jr.</suffix></name></person-group> (<year>1988</year>). <article-title>Tn916-dependent conjugal transfer of pC194 and pUB110 from <italic>Bacillus subtilis</italic> into <italic>Bacillus thuringiensis</italic> subsp. israelensis.</article-title> <source><italic>Plasmid</italic></source> <volume>20</volume> <fpage>113</fpage>&#x2013;<lpage>126</lpage>.</citation></ref>
<ref id="B35"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>O&#x2019;Brien</surname> <given-names>F. G.</given-names></name> <name><surname>Yui Eto</surname> <given-names>K.</given-names></name> <name><surname>Murphy</surname> <given-names>R. J.</given-names></name> <name><surname>Fairhurst</surname> <given-names>H. M.</given-names></name> <name><surname>Coombs</surname> <given-names>G. W.</given-names></name> <name><surname>Grubb</surname> <given-names>W. B.</given-names></name><etal/></person-group> (<year>2015</year>). <article-title>Origin-of-transfer sequences facilitate mobilisation of non-conjugative antimicrobial-resistance plasmids in <italic>Staphylococcus aureus</italic>.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>43</volume> <fpage>7971</fpage>&#x2013;<lpage>7983</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkv755</pub-id></citation></ref>
<ref id="B36"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pavlovic</surname> <given-names>G.</given-names></name> <name><surname>Burrus</surname> <given-names>V.</given-names></name> <name><surname>Gintz</surname> <given-names>B.</given-names></name> <name><surname>Decaris</surname> <given-names>B.</given-names></name> <name><surname>Guedon</surname> <given-names>G.</given-names></name></person-group> (<year>2004</year>). <article-title>Evolution of genomic islands by deletion and tandem accretion by site-specific recombination: ICESt1-related elements from <italic>Streptococcus thermophilus</italic>.</article-title> <source><italic>Microbiology</italic></source> <volume>150</volume> <fpage>759</fpage>&#x2013;<lpage>774</lpage>. <pub-id pub-id-type="doi">10.1099/mic.0.26883-0</pub-id></citation></ref>
<ref id="B37"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pollet</surname> <given-names>R. M.</given-names></name> <name><surname>Ingle</surname> <given-names>J. D.</given-names></name> <name><surname>Hymes</surname> <given-names>J. P.</given-names></name> <name><surname>Eakes</surname> <given-names>T. C.</given-names></name> <name><surname>Eto</surname> <given-names>K. Y.</given-names></name> <name><surname>Kwong</surname> <given-names>S. M.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>Processing of nonconjugative resistance plasmids by conjugation nicking enzyme of Staphylococci.</article-title> <source><italic>J. Bacteriol.</italic></source> <volume>198</volume> <fpage>888</fpage>&#x2013;<lpage>897</lpage>. <pub-id pub-id-type="doi">10.1128/JB.00832-15</pub-id></citation></ref>
<ref id="B38"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Puymege</surname> <given-names>A.</given-names></name> <name><surname>Bertin</surname> <given-names>S.</given-names></name> <name><surname>Guedon</surname> <given-names>G.</given-names></name> <name><surname>Payot</surname> <given-names>S.</given-names></name></person-group> (<year>2015</year>). <article-title>Analysis of <italic>Streptococcus agalactiae</italic> pan-genome for prevalence, diversity and functionality of integrative and conjugative or mobilizable elements integrated in the tRNA(Lys CTT) gene.</article-title> <source><italic>Mol. Genet. Genomics</italic></source> <volume>290</volume> <fpage>1727</fpage>&#x2013;<lpage>1740</lpage>. <pub-id pub-id-type="doi">10.1007/s00438-015-1031-9</pub-id></citation></ref>
<ref id="B39"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rabinovich</surname> <given-names>L.</given-names></name> <name><surname>Sigal</surname> <given-names>N.</given-names></name> <name><surname>Borovok</surname> <given-names>I.</given-names></name> <name><surname>Nir-Paz</surname> <given-names>R.</given-names></name> <name><surname>Herskovits</surname> <given-names>A. A.</given-names></name></person-group> (<year>2012</year>). <article-title>Prophage excision activates <italic>Listeria</italic> competence genes that promote phagosomal escape and virulence.</article-title> <source><italic>Cell</italic></source> <volume>150</volume> <fpage>792</fpage>&#x2013;<lpage>802</lpage>. <pub-id pub-id-type="doi">10.1016/j.cell.2012.06.036</pub-id></citation></ref>
<ref id="B40"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ramsay</surname> <given-names>J. P.</given-names></name> <name><surname>Sullivan</surname> <given-names>J. T.</given-names></name> <name><surname>Stuart</surname> <given-names>G. S.</given-names></name> <name><surname>Lamont</surname> <given-names>I. L.</given-names></name> <name><surname>Ronson</surname> <given-names>C. W.</given-names></name></person-group> (<year>2006</year>). <article-title>Excision and transfer of the <italic>Mesorhizobium loti</italic> R7A symbiosis island requires an integrase IntS, a novel recombination directionality factor RdfS, and a putative relaxase RlxS.</article-title> <source><italic>Mol. Microbiol.</italic></source> <volume>62</volume> <fpage>723</fpage>&#x2013;<lpage>734</lpage>. <pub-id pub-id-type="doi">10.1111/j.1365-2958.2006.05396.x</pub-id></citation></ref>
<ref id="B41"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Richards</surname> <given-names>V. P.</given-names></name> <name><surname>Palmer</surname> <given-names>S. R.</given-names></name> <name><surname>Pavinski Bitar</surname> <given-names>P. D.</given-names></name> <name><surname>Qin</surname> <given-names>X.</given-names></name> <name><surname>Weinstock</surname> <given-names>G. M.</given-names></name> <name><surname>Highlander</surname> <given-names>S. K.</given-names></name><etal/></person-group> (<year>2014</year>). <article-title>Phylogenomics and the dynamic genome evolution of the genus <italic>Streptococcus</italic>.</article-title> <source><italic>Genome Biol. Evol.</italic></source> <volume>6</volume> <fpage>741</fpage>&#x2013;<lpage>753</lpage>. <pub-id pub-id-type="doi">10.1093/gbe/evu048</pub-id></citation></ref>
<ref id="B42"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shkoporov</surname> <given-names>A. N.</given-names></name> <name><surname>Efimov</surname> <given-names>B. A.</given-names></name> <name><surname>Khokhlova</surname> <given-names>E. V.</given-names></name> <name><surname>Steele</surname> <given-names>J. L.</given-names></name> <name><surname>Kafarskaia</surname> <given-names>L. I.</given-names></name> <name><surname>Smeianov</surname> <given-names>V. V.</given-names></name></person-group> (<year>2008</year>). <article-title>Characterization of plasmids from human infant <italic>Bifidobacterium</italic> strains: sequence analysis and construction of <italic>E. coli</italic>-<italic>Bifidobacterium</italic> shuttle vectors.</article-title> <source><italic>Plasmid</italic></source> <volume>60</volume> <fpage>136</fpage>&#x2013;<lpage>148</lpage>. <pub-id pub-id-type="doi">10.1016/j.plasmid.2008.06.005</pub-id></citation></ref>
<ref id="B43"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Showsh</surname> <given-names>S. A.</given-names></name> <name><surname>Andrews</surname> <given-names>R. E.</given-names> <suffix>Jr.</suffix></name></person-group> (<year>1999</year>). <article-title>Analysis of the requirement for a pUB110 mob region during Tn916-dependent mobilization.</article-title> <source><italic>Plasmid</italic></source> <volume>41</volume> <fpage>179</fpage>&#x2013;<lpage>186</lpage>. <pub-id pub-id-type="doi">10.1006/plas.1999.1398</pub-id></citation></ref>
<ref id="B44"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sievers</surname> <given-names>F.</given-names></name> <name><surname>Wilm</surname> <given-names>A.</given-names></name> <name><surname>Dineen</surname> <given-names>D.</given-names></name> <name><surname>Gibson</surname> <given-names>T. J.</given-names></name> <name><surname>Karplus</surname> <given-names>K.</given-names></name> <name><surname>Li</surname> <given-names>W.</given-names></name><etal/></person-group> (<year>2011</year>). <article-title>Fast, scalable generation of high-quality protein multiple sequence alignments using Clustal Omega.</article-title> <source><italic>Mol. Syst. Biol.</italic></source> <volume>7</volume>:<issue>539</issue>. <pub-id pub-id-type="doi">10.1038/msb.2011.75</pub-id></citation></ref>
<ref id="B45"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Smillie</surname> <given-names>C.</given-names></name> <name><surname>Garcillan-Barcia</surname> <given-names>M. P.</given-names></name> <name><surname>Francia</surname> <given-names>M. V.</given-names></name> <name><surname>Rocha</surname> <given-names>E. P.</given-names></name> <name><surname>De La Cruz</surname> <given-names>F.</given-names></name></person-group> (<year>2010</year>). <article-title>Mobility of plasmids.</article-title> <source><italic>Microbiol. Mol. Biol. Rev.</italic></source> <volume>74</volume> <fpage>434</fpage>&#x2013;<lpage>452</lpage>. <pub-id pub-id-type="doi">10.1128/MMBR.00020-10</pub-id></citation></ref>
<ref id="B46"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tamura</surname> <given-names>K.</given-names></name> <name><surname>Stecher</surname> <given-names>G.</given-names></name> <name><surname>Peterson</surname> <given-names>D.</given-names></name> <name><surname>Filipski</surname> <given-names>A.</given-names></name> <name><surname>Kumar</surname> <given-names>S.</given-names></name></person-group> (<year>2013</year>). <article-title>MEGA6: molecular evolutionary genetics analysis version 6.0.</article-title> <source><italic>Mol. Biol. Evol.</italic></source> <volume>30</volume> <fpage>2725</fpage>&#x2013;<lpage>2729</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/mst197</pub-id></citation></ref>
<ref id="B47"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tang</surname> <given-names>F.</given-names></name> <name><surname>Bossers</surname> <given-names>A.</given-names></name> <name><surname>Harders</surname> <given-names>F.</given-names></name> <name><surname>Lu</surname> <given-names>C.</given-names></name> <name><surname>Smith</surname> <given-names>H.</given-names></name></person-group> (<year>2013</year>). <article-title>Comparative genomic analysis of twelve <italic>Streptococcus suis</italic> (pro)phages.</article-title> <source><italic>Genomics</italic></source> <volume>101</volume> <fpage>336</fpage>&#x2013;<lpage>344</lpage>. <pub-id pub-id-type="doi">10.1016/j.ygeno.2013.04.005</pub-id></citation></ref>
<ref id="B48"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Trotter</surname> <given-names>M.</given-names></name> <name><surname>McAuliffe</surname> <given-names>O.</given-names></name> <name><surname>Callanan</surname> <given-names>M.</given-names></name> <name><surname>Edwards</surname> <given-names>R.</given-names></name> <name><surname>Fitzgerald</surname> <given-names>G. F.</given-names></name> <name><surname>Coffey</surname> <given-names>A.</given-names></name><etal/></person-group> (<year>2006</year>). <article-title>Genome analysis of the obligately lytic bacteriophage 4268 of <italic>Lactococcus lactis</italic> provides insight into its adaptable nature.</article-title> <source><italic>Gene</italic></source> <volume>366</volume> <fpage>189</fpage>&#x2013;<lpage>199</lpage>. <pub-id pub-id-type="doi">10.1016/j.gene.2005.09.022</pub-id></citation></ref>
<ref id="B49"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Weaver</surname> <given-names>K. E.</given-names></name> <name><surname>Kwong</surname> <given-names>S. M.</given-names></name> <name><surname>Firth</surname> <given-names>N.</given-names></name> <name><surname>Francia</surname> <given-names>M. V.</given-names></name></person-group> (<year>2009</year>). <article-title>The RepA_N replicons of gram-positive bacteria: a family of broadly distributed but narrow host range plasmids.</article-title> <source><italic>Plasmid</italic></source> <volume>61</volume> <fpage>94</fpage>&#x2013;<lpage>109</lpage>. <pub-id pub-id-type="doi">10.1016/j.plasmid.2008.11.004</pub-id></citation></ref>
<ref id="B50"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wisniewski</surname> <given-names>J. A.</given-names></name> <name><surname>Traore</surname> <given-names>D. A.</given-names></name> <name><surname>Bannam</surname> <given-names>T. L.</given-names></name> <name><surname>Lyras</surname> <given-names>D.</given-names></name> <name><surname>Whisstock</surname> <given-names>J. C.</given-names></name> <name><surname>Rood</surname> <given-names>J. I.</given-names></name></person-group> (<year>2016</year>). <article-title>TcpM: a novel relaxase that mediates transfer of large conjugative plasmids from <italic>Clostridium perfringens</italic>.</article-title> <source><italic>Mol. Microbiol.</italic></source> <volume>99</volume> <fpage>884</fpage>&#x2013;<lpage>896</lpage>. <pub-id pub-id-type="doi">10.1111/mmi.13270</pub-id></citation></ref>
</ref-list>
<fn-group>
<fn id="fn01"><label>1</label><p><ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/genome/browse/">http://www.ncbi.nlm.nih.gov/genome/browse/</ext-link>, last accessed December 2013</p></fn>
<fn id="fn02"><label>2</label><p><ext-link ext-link-type="uri" xlink:href="http://central.biomart.org/">http://central.biomart.org/</ext-link></p></fn>
<fn id="fn03"><label>3</label><p><ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/Structure/cdd/wrpsb.cgi">http://www.ncbi.nlm.nih.gov/Structure/cdd/wrpsb.cgi</ext-link></p></fn>
<fn id="fn04"><label>4</label><p><ext-link ext-link-type="uri" xlink:href="http://mobyle.pasteur.fr/cgi-bin/portal.py#forms::CONJscan-T4SSscan">http://mobyle.pasteur.fr/cgi-bin/portal.py#forms::CONJscan-T4SSscan</ext-link></p></fn>
<fn id="fn05"><label>5</label><p><ext-link ext-link-type="uri" xlink:href="https://toolkit.tuebingen.mpg.de/blastclust">https://toolkit.tuebingen.mpg.de/blastclust</ext-link></p></fn>
<fn id="fn06"><label>6</label><p><ext-link ext-link-type="uri" xlink:href="http://circos.ca/">http://circos.ca/</ext-link></p></fn>
</fn-group>
</back>
</article>