<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Microbiol.</journal-id>
<journal-title>Frontiers in Microbiology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Microbiol.</abbrev-journal-title>
<issn pub-type="epub">1664-302X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fmicb.2017.02504</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Microbiology</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Comparative Metagenomics of Cellulose- and Poplar Hydrolysate-Degrading Microcosms from Gut Microflora of the Canadian Beaver (<italic>Castor canadensis</italic>) and North American Moose (<italic>Alces americanus</italic>) after Long-Term Enrichment</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name><surname>Wong</surname> <given-names>Mabel T.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Wang</surname> <given-names>Weijun</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/313476/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Couturier</surname> <given-names>Marie</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Razeq</surname> <given-names>Fakhria M.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/494629/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Lombard</surname> <given-names>Vincent</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/504932/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Lapebie</surname> <given-names>Pascal</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/504931/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Edwards</surname> <given-names>Elizabeth A.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/90890/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Terrapon</surname> <given-names>Nicolas</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/504927/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Henrissat</surname> <given-names>Bernard</given-names></name>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
<xref ref-type="aff" rid="aff6"><sup>6</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/18544/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Master</surname> <given-names>Emma R.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff7"><sup>7</sup></xref>
<xref ref-type="author-notes" rid="fn001"><sup>&#x002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/314245/overview"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>Department of Chemical Engineering and Applied Chemistry, University of Toronto</institution>, <addr-line>Toronto, ON</addr-line>, <country>Canada</country></aff>
<aff id="aff2"><sup>2</sup><institution>Centre de Recherches sur les Macromol&#x00E9;cules V&#x00E9;g&#x00E9;tales &#x2013; Universit&#x00E9; Grenoble Alpes</institution>, <addr-line>Grenoble</addr-line>, <country>France</country></aff>
<aff id="aff3"><sup>3</sup><institution>Centre National de la Recherche Scientifique, Centre de Recherches sur les Macromol&#x00E9;cules V&#x00E9;g&#x00E9;tales</institution>, <addr-line>Grenoble</addr-line>, <country>France</country></aff>
<aff id="aff4"><sup>4</sup><institution>Architecture et Fonction des Macromol&#x00E9;cules Biologiques, Aix-Marseille Universit&#x00E9;</institution>, <addr-line>Marseille</addr-line>, <country>France</country></aff>
<aff id="aff5"><sup>5</sup><institution>UMR 7257, Centre National de la Recherche Scientifique</institution>, <addr-line>Marseille</addr-line>, <country>France</country></aff>
<aff id="aff6"><sup>6</sup><institution>Department of Biological Sciences, King Abdulaziz University</institution>, <addr-line>Jeddah</addr-line>, <country>Saudi Arabia</country></aff>
<aff id="aff7"><sup>7</sup><institution>Department of Bioproducts and Biosystems, Aalto University</institution>, <addr-line>Espoo</addr-line>, <country>Finland</country></aff>
<author-notes>
<fn fn-type="edited-by"><p>Edited by: <italic>Guillermina Hernandez-Raquet, Institut National de la Recherche Agronomique (INRA), France</italic></p></fn>
<fn fn-type="edited-by"><p>Reviewed by: <italic>Xiuzhu Dong, Institute of Microbiology (CAS), China; Suzanne Lynn Ishaq, University of Oregon, United States</italic></p></fn>
<fn fn-type="corresp" id="fn001"><p>&#x002A;Correspondence: <italic>Emma R. Master, <email>emma.master@utoronto.ca</email></italic></p></fn>
<fn fn-type="other" id="fn002"><p>This article was submitted to Systems Microbiology, a section of the journal Frontiers in Microbiology</p></fn></author-notes>
<pub-date pub-type="epub">
<day>20</day>
<month>12</month>
<year>2017</year>
</pub-date>
<pub-date pub-type="collection">
<year>2017</year>
</pub-date>
<volume>8</volume>
<elocation-id>2504</elocation-id>
<history>
<date date-type="received">
<day>12</day>
<month>10</month>
<year>2017</year>
</date>
<date date-type="accepted">
<day>01</day>
<month>12</month>
<year>2017</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2017 Wong, Wang, Couturier, Razeq, Lombard, Lapebie, Edwards, Terrapon, Henrissat and Master.</copyright-statement>
<copyright-year>2017</copyright-year>
<copyright-holder>Wong, Wang, Couturier, Razeq, Lombard, Lapebie, Edwards, Terrapon, Henrissat and Master</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) or licensor are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<abstract>
<p>To identify carbohydrate-active enzymes (CAZymes) that might be particularly relevant for wood fiber processing, we performed a comparative metagenomic analysis of digestive systems from Canadian beaver (<italic>Castor canadensis</italic>) and North American moose (<italic>Alces americanus</italic>) following 3 years of enrichment on either microcrystalline cellulose or poplar hydrolysate. In total, 9,386 genes encoding CAZymes and carbohydrate-binding modules (CBMs) were identified, with up to half predicted to originate from <italic>Firmicutes, Bacteroidetes, Chloroflexi</italic>, and <italic>Proteobacteria</italic> phyla, and up to 17% from unknown phyla. Both PCA and hierarchical cluster analysis distinguished the annotated glycoside hydrolase (GH) distributions identified herein, from those previously reported for grass-feeding mammals and herbivorous foragers. The CAZyme profile of moose rumen enrichments also differed from a recently reported moose rumen metagenome, most notably by the absence of GH13-appended dockerins. Consistent with substrate-driven convergence, CAZyme profiles from both poplar hydrolysate-fed cultures differed from cellulose-fed cultures, most notably by increased numbers of unique sequences belonging to families GH3, GH5, GH43, GH53, and CE1. Moreover, pairwise comparisons of moose rumen enrichments further revealed higher counts of GH127 and CE15 families in cultures fed with poplar hydrolysate. To expand our scope to lesser known carbohydrate-active proteins, we identified and compared multi-domain proteins comprising both a CBM and domain of unknown function (DUF) as well as proteins with unknown function within the 416 predicted polysaccharide utilization loci (PULs). Interestingly, DUF362, identified in iron&#x2013;sulfur proteins, was consistently appended to CBM9; on the other hand, proteins with unknown function from PULs shared little identity unless from identical PULs. Overall, this study sheds new light on the lignocellulose degrading capabilities of microbes originating from digestive systems of mammals known for fiber-rich diets, and highlights the value of enrichment to select new CAZymes from metagenome sequences for future biochemical characterization.</p>
</abstract>
<kwd-group>
<kwd>comparative metagenomics</kwd>
<kwd>lignocellulose degradation</kwd>
<kwd>carbohydrate-active enzymes (CAZymes)</kwd>
<kwd>polysaccharide utilization loci (PULs)</kwd>
<kwd>microbial enrichment</kwd>
<kwd>digestive microbiome</kwd>
<kwd>beaver</kwd>
<kwd>moose</kwd>
</kwd-group>
<contract-num rid="cn001">322820</contract-num>
<contract-num rid="cn002">648925</contract-num>
<contract-sponsor id="cn001">European Research Council<named-content content-type="fundref-id">10.13039/501100000781</named-content></contract-sponsor>
<contract-sponsor id="cn002">European Research Council<named-content content-type="fundref-id">10.13039/501100000781</named-content></contract-sponsor>
<counts>
<fig-count count="7"/>
<table-count count="1"/>
<equation-count count="0"/>
<ref-count count="67"/>
<page-count count="14"/>
<word-count count="0"/>
</counts>
</article-meta>
</front>
<body>
<sec><title>Introduction</title>
<p>Lignocellulose comprises the non-edible fraction of plant biomass and as such is a recognized resource for the production of renewable energy, chemicals, and materials. The main components of lignocellulose are cellulose, hemicellulose, pectin, and lignin, the proportions and particular chemistries of which depend largely on the plant type and fraction (<xref ref-type="bibr" rid="B33">Kumar et al., 2008</xref>). For instance, glucuronoarabinoxylan is a typical hemicellulose found in agricultural crops, whereas glucuronoxylan is the predominant hemicellulose in wood tissue of deciduous trees, including poplar (<xref ref-type="bibr" rid="B47">Peng et al., 2012</xref>). Bioconversion pathways that convert various lignocellulose sources to targeted end products require the concerted action of CAZymes, which include glycosyl hydrolases (GHs), carbohydrate esterases (CEs), polysaccharide lyases (PLs), auxiliary activities (AAs), and of carbohydrate binding modules (CBMs) that are classified into families according to amino acid sequence similarity in the CAZy database<sup><xref ref-type="fn" rid="fn01">1</xref></sup> (<xref ref-type="bibr" rid="B35">Lombard et al., 2014</xref>). Various pretreatment methods, including steam explosion, have been developed to maximize enzymatic conversion of lignocellulosic resources (<xref ref-type="bibr" rid="B19">Excoffier et al., 1991</xref>).</p>
<p>Metagenomic approaches to identify CAZymes relevant to the conversion of a given biomass feedstock have considered environmental samples persistently subjected to the targeted feedstock. For example, metagenomic analyses aimed at identifying CAZymes most relevant to bioconversion of non-woody biomass have sampled digestive systems of animals that graze on straw, grasses, and lichens (<xref ref-type="bibr" rid="B49">Pope et al., 2010</xref>). Parallel metagenomic analyses to identify CAZymes contributing to bioconversion of woody biomass have included samples ranging from forest soils (<xref ref-type="bibr" rid="B16">Damon et al., 2012</xref>; <xref ref-type="bibr" rid="B48">Pold et al., 2016</xref>), to insects (<xref ref-type="bibr" rid="B63">Warnecke et al., 2007</xref>; <xref ref-type="bibr" rid="B24">He et al., 2013</xref>; <xref ref-type="bibr" rid="B52">Rossmassler et al., 2015</xref>), and wood-feeding mollusks (<xref ref-type="bibr" rid="B45">O&#x2019;Connor et al., 2014</xref>). Alternatively, enrichment of environmental samples on specific biomass feedstocks prior to metagenome sequencing can improve sequence assembly (<xref ref-type="bibr" rid="B18">DeAngelis et al., 2010</xref>), while facilitating the identification of most pertinent CAZymes (<xref ref-type="bibr" rid="B60">van der Lelie et al., 2012</xref>). In a few cases, direct comparison of CAZyme profiles has also been performed for enrichment cultures originating from the same source. Examples include soil-derived microbial communities enriched with wheat straw, switchgrass, and corn stover (<xref ref-type="bibr" rid="B30">Jimen&#x00E9;z et al., 2016</xref>), and those digesting mixed lignocellulosic substrates in stationary versus submerged and agitated conditions (<xref ref-type="bibr" rid="B25">Heiss-Blanquet et al., 2016</xref>; <xref ref-type="bibr" rid="B62">Wang et al., 2016</xref>). In addition to the influence of enrichment condition, such metagenomic studies highlight the increase in number of CAZyme sequences from families associated with hydrolysis of oligosaccharides and side groups of hemicelluloses and/or pectins (e.g., GH3, GH43).</p>
<p>Aside from identifying CAZyme families most pertinent to conversion of specific biomass feedstocks, metagenomic analysis of biomass-degrading communities has uncovered a diverse array of encoded polysaccharide utilization loci (PULs) and multi-modular proteins. Briefly, PULs comprise physically linked genes that encode CAZymes and other proteins that work in concert to degrade specific glycans. Accordingly, PULs have emerged as especially fruitful regions within metagenome sequences for enzyme discovery (<xref ref-type="bibr" rid="B34">Larsbrink et al., 2016</xref>; <xref ref-type="bibr" rid="B46">Patrascu et al., 2017</xref>). For instance, in the past year alone, detailed biochemical characterization of PULs with different selectivity has uncovered novel activities that contribute to the degradation of pectin (<xref ref-type="bibr" rid="B43">Ndeh et al., 2017</xref>), xylan (<xref ref-type="bibr" rid="B62">Wang et al., 2016</xref>), and galactomannan (<xref ref-type="bibr" rid="B7">Bagenholm et al., 2017</xref>), as well as fungal cell wall components including chitin (<xref ref-type="bibr" rid="B34">Larsbrink et al., 2016</xref>) and &#x03B2;-glucans (<xref ref-type="bibr" rid="B58">Temple et al., 2017</xref>). Likewise, multi-modular proteins and cellulosomal subunits identified from metagenome sequences and bacterial isolates constitute an additional reservoir for CAZyme discovery (<xref ref-type="bibr" rid="B66">Zhang et al., 2014</xref>). Most recently, CAZyme-linked dockerins were reported in PULs in a moose rumen microbiome (<xref ref-type="bibr" rid="B57">Svartstr&#x00F6;m et al., 2017</xref>).</p>
<p>With the aim to identify CAZymes and novel proteins that target woody biomass, here we applied a comparative metagenomics approach to identify microbial enzymes encoded by the gut digestive microflora of wood-feeding Canadian beaver (<italic>Castor canadensis</italic>) and North American moose (<italic>Alces americanus</italic>) that are likely to promote the conversion of pretreated wood chips. Briefly, in winter months especially, beavers apply an obligate woody diet consisting of twigs, bark, and tree trunks; such seasonal confinement to a wood-based diet is also common to moose, ungulates that consume twigs, shrubs, and bark during the winter (<xref ref-type="bibr" rid="B15">Chaney, 2003</xref>; <xref ref-type="bibr" rid="B27">Hood and Bayley, 2009</xref>). In an earlier study, we confirmed the existence of biomass-degrading microorganisms in gut digestive microflora of beaver and moose, and their ability to transform lignocellulosic substrates under anaerobic conditions (<xref ref-type="bibr" rid="B65">Wong et al., 2016</xref>). Herein, we report the metagenomes of corresponding gut digestive microflora enriched for over 3 years on either microcrystalline cellulose or pretreated poplar wood chips. In particular, metagenome sequences were compared to reveal CAZyme families that are consistently enriched following growth on poplar hydrolysate compared to growth on cellulose. The four metagenomes were also mined in an effort to identify novel candidate enzymes for future characterization. Two approaches were devised to facilitate this analysis: (1) prediction of bacterial PULs and analysis of encoded proteins with unknown function within PULs, and (2) prediction of multi-modular proteins that comprise both modules recognized to contribute to polysaccharide conversion (e.g., a carbohydrate-binding domain) and domains with unknown function.</p>
</sec>
<sec id="s1" sec-type="materials|methods">
<title>Materials and Methods</title>
<sec><title>Ethics Statement</title>
<p>An ethics approval from an Animal Care and Use Committee was not required by the Office of Research Ethics of the University of Toronto, as the moose rumen sample was collected from a dead moose that was hunted in the wild for meat by a registered hunter with a license authorized by the Ministry of Natural Resources and Forestry under Government of Ontario, Canada.</p>
</sec>
<sec><title>Setup and Maintenance of Lignocellulose Active Enrichment Cultures</title>
<p>As previously described (<xref ref-type="bibr" rid="B65">Wong et al., 2016</xref>), lignocellulose-degrading microorganisms from the digestive systems of Canadian beaver (<italic>Castor canadensis</italic>) and North American moose (<italic>Alces americanus</italic>) were sampled and enriched under anaerobic conditions at 36&#x00B0;C. Briefly, approximately 15 ml of the beaver dropping and moose rumen inocula were transferred to separate 160 mM Wheaton glass serum bottles, which were amended with 45 mL of sulfide-reduced mineral medium and 36 mg COD equivalents of microcrystalline cellulose (Avicel PH101; purchased from Sigma&#x2013;Aldrich) or steam exploded poplar hydrolysate (provided by SunOpta Inc., Canada) (<xref ref-type="bibr" rid="B65">Wong et al., 2016</xref>). Biogas production by resulting cultures was carefully monitored to track metabolic activity.</p>
</sec>
<sec><title>Metagenomic DNA Extraction and Sequencing</title>
<p>Following 3 years of cultivation and 10 enrichment phases, 10 ml of each enrichment culture was harvested at early stationary phase of biogas production. Samples were centrifuged at 15,000 &#x00D7; <italic>g</italic> for 15 min at 4&#x00B0;C, and total community DNA was extracted using the QIAamp DNA Stool Mini Kit (Qiagen, Hilden, Germany) (Supplementary Table <xref ref-type="supplementary-material" rid="SM1">S1</xref>). The concentration and quality of the extracted metagenomic DNA were assessed by measuring the 260/280 absorbance ratio using a Nanodrop 2000 Spectrophotometer (Thermo Scientific, MA, United States), and then stored at -80&#x00B0;C. A TruSeq library was constructed for each DNA sample. Illumina paired-end sequencing was chosen and performed with Illumina HiSeq 2000 (Illumina Inc., San Diego, CA, United States) at G&#x00E9;nome Qu&#x00E9;bec Innovation Centre.</p>
</sec>
<sec><title>Metagenome Assembly</title>
<p>The output reads were processed by Trimmomatic 0.32 for the removal of adapters and quality filtering (<xref ref-type="bibr" rid="B12">Bolger et al., 2014</xref>). The quality-trimmed metagenomic reads were assembled using ABySS with minimum coverage of 20, and minimum kmer length of 96 nucleotides (<xref ref-type="bibr" rid="B53">Simpson et al., 2009</xref>). Using an in house Perl script, NKD of the assembled contigs were calculated using the formula NKD = <italic>n</italic>/(<italic>L</italic>-<italic>k</italic>+1), where <italic>n</italic> is the total number of kmers assembled to the contig, <italic>L</italic> is the contig length, and <italic>k</italic> is the kmer length (96) used in the assembly. Contig distributions were then visualized by plotting the calculated NKD against contig length.</p>
</sec>
<sec><title>Annotation of CAZyme Families, Multi-Modular Sequences, and Polysaccharide Utilization Loci (PULs)</title>
<p>Assembled contigs were subjected to ORF prediction using Prodigal (<xref ref-type="bibr" rid="B29">Hyatt et al., 2010</xref>); predicted proteins were then assigned to CAZyme families using a combination of BLAST and HMM searches against CAZy reference sequences and families as already described (<xref ref-type="bibr" rid="B2">Al-Masaudi et al., 2017</xref>). Counts of CAZyme sequences were normalized to compare the diversity of CAZyme sequences identified within each enrichment culture. Specifically, since the number of predicted ORFs was highest for the metagenome of beaver droppings enriched on poplar hydrolysate (BD-PH, <bold>Table <xref ref-type="table" rid="T1">1</xref></bold>) then:</p>
<table-wrap position="float" id="T1">
<label>Table 1</label>
<caption><p>Statistics of the sequencing and assembly of the metagenomes of cellulose (C) and poplar hydrolysate (PH)-fed enrichment cultures from beaver dropping (BD) and moose rumen (MR).</p></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<th valign="top" align="left">Inocula<hr/></th>
<th valign="top" align="center" colspan="2">Beaver droppings<hr/></th>
<th valign="top" align="center" colspan="2">Moose rumen<hr/></th></tr>
<tr>
<th valign="top" align="left">Enrichment</th>
<th valign="top" align="center">Cellulose</th>
<th valign="top" align="center">Poplar hydrolysate</th>
<th valign="top" align="center">Cellulose</th>
<th valign="top" align="center">Poplar hydrolysate</th>
</tr>
<tr>
<th valign="top" align="left">Abbreviation</th>
<th valign="top" align="center">BD-C</th>
<th valign="top" align="center">BD-PH</th>
<th valign="top" align="center">MR-C</th>
<th valign="top" align="center">MR-PH</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Number of quality trimmed reads (% passed)</td>
<td valign="top" align="center">74,999,337 (99.7%)</td>
<td valign="top" align="center">78,144,385 (99.7%)</td>
<td valign="top" align="center">71,980,296 (99.8%)</td>
<td valign="top" align="center">88,305,224 (99.8%)</td>
</tr>
<tr>
<td valign="top" align="left">Total Mbp assembled (Mbp)</td>
<td valign="top" align="center">78</td>
<td valign="top" align="center">81.5</td>
<td valign="top" align="center">58.3</td>
<td valign="top" align="center">67.6</td>
</tr>
<tr>
<td valign="top" align="left">Number of contigs</td>
<td valign="top" align="center">5,010</td>
<td valign="top" align="center">10,553</td>
<td valign="top" align="center">5,705</td>
<td valign="top" align="center">6,941</td>
</tr>
<tr>
<td valign="top" align="left">Longest contig (bp)</td>
<td valign="top" align="center">1,266,318</td>
<td valign="top" align="center">674,797</td>
<td valign="top" align="center">1,299,156</td>
<td valign="top" align="center">1,131,879</td>
</tr>
<tr>
<td valign="top" align="left">N50 (bp)</td>
<td valign="top" align="center">92,758</td>
<td valign="top" align="center">68,167</td>
<td valign="top" align="center">71,246</td>
<td valign="top" align="center">106,046</td>
</tr>
<tr>
<td valign="top" align="left">Number of ORFs</td>
<td valign="top" align="center">71,348</td>
<td valign="top" align="center">81,969</td>
<td valign="top" align="center">56,127</td>
<td valign="top" align="center">66,970</td>
</tr>
<tr>
<td valign="top" align="left">Normalized counts<sup>1</sup> of plant polysaccharide-active</td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
</tr>
<tr>
<td valign="top" align="left">CAZymes (% of all CAZymes)</td>
<td valign="top" align="center">709 (23.4%)</td>
<td valign="top" align="center">830 (32.3%)</td>
<td valign="top" align="center">525 (22.4%)</td>
<td valign="top" align="center">834 (32.7%)</td>
</tr>
<tr>
<td valign="top" align="left">PUL</td>
<td valign="top" align="center">38</td>
<td valign="top" align="center">171</td>
<td valign="top" align="center">47</td>
<td valign="top" align="center">42</td></tr>
<tr>
<td valign="top" align="left">Type 1 dockerin</td>
<td valign="top" align="center">95</td>
<td valign="top" align="center">116</td>
<td valign="top" align="center">68</td>
<td valign="top" align="center">94</td>
</tr>
<tr>
<td valign="top" align="left">Type 1 cohesin</td>
<td valign="top" align="center">42</td>
<td valign="top" align="center">50</td>
<td valign="top" align="center">35</td>
<td valign="top" align="center">41</td></tr>
</tbody></table>
<table-wrap-foot>
<attrib><italic><sup>1</sup>Counts were normalized by the number of ORFs.</italic></attrib>
</table-wrap-foot>
</table-wrap>
<disp-formula id="E1"><mml:math id="M1"><mml:mrow><mml:mo>Normalized</mml:mo><mml:mo>&#x2009;</mml:mo><mml:mo>count</mml:mo><mml:mo>&#x2009;</mml:mo><mml:mo>=</mml:mo><mml:mo>&#x2009;</mml:mo><mml:mfrac><mml:mrow><mml:mtable><mml:mtr><mml:mtd><mml:mrow><mml:mo>count</mml:mo><mml:mo>&#x2009;</mml:mo><mml:mo>of</mml:mo><mml:mo>&#x2009;</mml:mo><mml:mo>identified</mml:mo><mml:mo>&#x2009;</mml:mo><mml:mo>sequences</mml:mo><mml:mo>&#x2009;</mml:mo><mml:mo>in</mml:mo><mml:mo>&#x2009;</mml:mo><mml:mo>a</mml:mo><mml:mo>&#x2009;</mml:mo><mml:mo>given</mml:mo><mml:mo>&#x2009;</mml:mo><mml:mo>CAZyme</mml:mo><mml:mo>&#x2009;</mml:mo><mml:mo>family</mml:mo><mml:mo>&#x2009;</mml:mo></mml:mrow></mml:mtd></mml:mtr><mml:mtr><mml:mtd><mml:mrow><mml:mo>within</mml:mo><mml:mo>&#x2009;</mml:mo><mml:mo>a</mml:mo><mml:mo>&#x2009;</mml:mo><mml:mo>metagenome</mml:mo><mml:mo>&#x2009;</mml:mo><mml:mo>of</mml:mo><mml:mo>&#x2009;</mml:mo><mml:mo>interest</mml:mo><mml:mo>&#x2009;</mml:mo><mml:mo>&#x00D7;</mml:mo><mml:mo>&#x2009;</mml:mo><mml:mo>number</mml:mo><mml:mo>&#x2009;</mml:mo><mml:mo>of</mml:mo><mml:mo>&#x2009;</mml:mo><mml:mo>ORFs</mml:mo><mml:mo>&#x2009;</mml:mo></mml:mrow></mml:mtd></mml:mtr><mml:mtr><mml:mtd><mml:mrow><mml:mo>of</mml:mo><mml:mo>&#x2009;</mml:mo><mml:mo>BD-PH</mml:mo><mml:mo>&#x2009;</mml:mo><mml:mo>metagenome</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:mrow><mml:mrow><mml:mtable><mml:mtr><mml:mtd><mml:mrow><mml:mo>number</mml:mo><mml:mo>&#x2009;</mml:mo><mml:mo>of</mml:mo><mml:mo>&#x2009;</mml:mo><mml:mo>ORFs</mml:mo><mml:mo>&#x2009;</mml:mo><mml:mo>of</mml:mo><mml:mo>&#x2009;</mml:mo><mml:mo>a</mml:mo><mml:mo>&#x2009;</mml:mo><mml:mo>metagenome</mml:mo><mml:mo>&#x2009;</mml:mo><mml:mo>of</mml:mo><mml:mo>&#x2009;</mml:mo><mml:mo>interest</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:mrow></mml:mfrac></mml:mrow></mml:math></disp-formula>
<p>Relative abundance for a given CAZyme family in a metagenome was calculated by</p>
<disp-formula id="E2"><mml:math id="M2"><mml:mrow><mml:mo>Relative</mml:mo><mml:mo>&#x2009;</mml:mo><mml:mo>abundance</mml:mo><mml:mo>&#x2009;</mml:mo><mml:mo>=</mml:mo><mml:mo>&#x2009;</mml:mo><mml:mfrac><mml:mrow><mml:mtable><mml:mtr><mml:mtd><mml:mrow><mml:mo>identified</mml:mo><mml:mo>&#x2009;</mml:mo><mml:mo>counts</mml:mo><mml:mo>&#x2009;</mml:mo><mml:mo>for</mml:mo><mml:mo>&#x2009;</mml:mo><mml:mo>a</mml:mo><mml:mo>&#x2009;</mml:mo><mml:mo>given</mml:mo><mml:mo>&#x2009;</mml:mo><mml:mo>CAZyme</mml:mo><mml:mo>&#x2009;</mml:mo><mml:mo>family</mml:mo><mml:mo>&#x2009;</mml:mo><mml:mo>in</mml:mo><mml:mo>&#x2009;</mml:mo><mml:mo>a</mml:mo><mml:mo>&#x2009;</mml:mo></mml:mrow></mml:mtd></mml:mtr><mml:mtr><mml:mtd><mml:mrow><mml:mo>metagenome</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:mrow><mml:mrow><mml:mtable><mml:mtr><mml:mtd><mml:mrow><mml:mo>total</mml:mo><mml:mo>&#x2009;</mml:mo><mml:mo>identified</mml:mo><mml:mo>&#x2009;</mml:mo><mml:mo>counts</mml:mo><mml:mo>&#x2009;</mml:mo><mml:mo>of</mml:mo><mml:mo>&#x2009;</mml:mo><mml:mo>CAZyme</mml:mo><mml:mo>&#x2009;</mml:mo><mml:mo>in</mml:mo><mml:mo>&#x2009;</mml:mo><mml:mo>a</mml:mo><mml:mo>&#x2009;</mml:mo></mml:mrow></mml:mtd></mml:mtr><mml:mtr><mml:mtd><mml:mrow><mml:mo>metagenome</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:mrow></mml:mfrac><mml:mo>&#x00D7;</mml:mo><mml:mn>100</mml:mn><mml:mi>&#x0025;</mml:mi></mml:mrow></mml:math></disp-formula>
<p>Public metagenomes from the digestive systems of cow (<xref ref-type="bibr" rid="B26">Hess et al., 2011</xref>), moose (<xref ref-type="bibr" rid="B57">Svartstr&#x00F6;m et al., 2017</xref>), panda (<xref ref-type="bibr" rid="B67">Zhu et al., 2011</xref>), reindeer (<xref ref-type="bibr" rid="B50">Pope et al., 2012</xref>), Saudi sheep (<xref ref-type="bibr" rid="B2">Al-Masaudi et al., 2017</xref>), termite (<xref ref-type="bibr" rid="B63">Warnecke et al., 2007</xref>), and wallaby (<xref ref-type="bibr" rid="B49">Pope et al., 2010</xref>) were also reannotated based on the latest version of the CAZy database and included in this calculation. Relative abundances of predicted plant (poly)saccharide-active CAZyme families (<bold>Figure <xref ref-type="fig" rid="F4">4</xref></bold>) were then extracted for hierarchical clustering (correlation clustering and average linkage) and PCA using R statistics in ClustVis (<xref ref-type="bibr" rid="B40">Metsalu and Vilo, 2015</xref>). Taxonomic assignment of predicted CAZymes from each metagenome was determined using protein sequences belonging to archaea, bacteria, fungi, other microbial eukaryotes, and viruses reported in the NCBI-NR database (downloaded 16 May 2017) using Kaiju in greedy mode with default settings (<xref ref-type="bibr" rid="B38">Menzel et al., 2016</xref>). The phylogenetic distributions of the top 10 identified organisms were visualized at phylum and class levels in a chord diagram using Circos (<xref ref-type="bibr" rid="B32">Krzywinski et al., 2009</xref>).</p>
<p>Cellulosomal modules (dockerin and cohesin domains) as well as S-layer homology domains were identified using reference sequences and models built from the literature (<xref ref-type="bibr" rid="B39">Mesnage et al., 2000</xref>; <xref ref-type="bibr" rid="B61">Venditto et al., 2016</xref>; <xref ref-type="bibr" rid="B4">Artzi et al., 2017</xref>). Proteins with CBMs appended to >200 amino acids not covered by any CAZy module were subjected to Pfam domain annotation (<xref ref-type="bibr" rid="B20">Finn et al., 2016</xref>) using InterProScan (<xref ref-type="bibr" rid="B31">Jones et al., 2014</xref>) to identify conserved DUF (Goodacre et al., 2014). PULs were predicted around <italic>susCD</italic>-like genes, and boundaries were extended based on intergenic distances, the presence of CAZymes and of regulatory genes (e.g., hybrid two-component system protein, extracytoplasmic function (ECF) &#x03C3;/anti-&#x03C3; factors, etc.) following the automatic method used in PULDB (<xref ref-type="bibr" rid="B59">Terrapon et al., 2015</xref>). The proteins with unknown functions from the PULs reported here and in PULDB<sup><xref ref-type="fn" rid="fn02">2</xref></sup> were pooled and submitted to CD-HIT web server (<xref ref-type="bibr" rid="B28">Huang et al., 2010</xref>) to identify proteins that meet a similarity threshold, which was defined by being &#x2265;70% identical to the representative sequence, and having &#x2265;70% alignment coverage. The sequence reads were submitted to NCBI under the Bioproject ID <ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="SUB1022597">SUB1022597</ext-link>.</p>
</sec>
</sec>
<sec><title>Results and Discussion</title>
<sec><title>Metagenomic DNA Extraction and Sequencing Statistics</title>
<p>Each metagenomic DNA sample (Supplementary Table <xref ref-type="supplementary-material" rid="SM1">S1</xref>) yielded 71&#x2013;88 Mb high-quality reads (150 bp long each), which were assembled into 5,010 to 10,553 contigs per metagenome (<bold>Table <xref ref-type="table" rid="T1">1</xref></bold>). The N50 (i.e., the length at which 50% of the assembled contigs were equal to or longer than) ranged between 68 and 105 kbp, and longest contigs were between 674 kbp and 1.13 Mbp. As shown in the summary of contig profiles (Supplementary Figure <xref ref-type="supplementary-material" rid="SM1">S1</xref>), longer contigs were generally present at lower NKD.</p>
</sec>
<sec><title>Comparison of Predicted CAZyme Sequences with Existing Data Sets</title>
<p>In total, 9,386 genes encoding CAZymes and CBMs were predicted from the four metagenomes (Supplementary Table <xref ref-type="supplementary-material" rid="SM1">S2</xref>). These sequences were assigned to 100 distinct families of GHs, 13 families of CEs, 15 families of PLs, and 39 families of GTs, as well as 43 families of associated CBMs. As observed for other anaerobic microbial communities (<xref ref-type="bibr" rid="B2">Al-Masaudi et al., 2017</xref>; <xref ref-type="bibr" rid="B57">Svartstr&#x00F6;m et al., 2017</xref>), no auxiliary redox enzymes were identified.</p>
<p>On average, 13% (up to 17% in cellulose-fed moose rumen culture) of the annotated CAZymes were taxonomically unassigned or assigned to unknown species. The phylogenetic origins of the remaining varied among the metagenomes, with most of them derived from <italic>Firmicutes, Bacteroidetes, Chloroflexi</italic>, and <italic>Proteobacteria</italic> phyla (<bold>Figure <xref ref-type="fig" rid="F1">1</xref></bold>). Up to 14% of predicted CAZyme sequences from cellulose-fed enrichments were assigned to class <italic>Anaerolineae</italic>, whereas CAZyme assignments to class <italic>Gammaproteobacteria</italic> were unique to cultures fed on poplar hydrolysate (<bold>Figure <xref ref-type="fig" rid="F1">1</xref></bold> and Supplementary Figure <xref ref-type="supplementary-material" rid="SM1">S2</xref>). By contrast, members from <italic>Clostridia</italic> and <italic>Bacteroidia</italic> classes contributed to 23&#x2013;52% of the annotated CAZymes across the metagenomes, where representation by these classes was between two and five times higher in poplar hydrolysate-fed cultures than in cellulose-fed ones. Moreover, CAZyme families that comprise plant polysaccharide-active enzymes (i.e., families GH2, GH3, GH5, GH9, GH43, GH51, and CE1) were most frequently assigned to either <italic>Clostridia</italic> or <italic>Bacteroidia</italic> (Supplementary Figure <xref ref-type="supplementary-material" rid="SM1">S2</xref>). In particular, GH5 sequences were most frequently assigned to <italic>Clostridia</italic> in poplar hydrolysate-fed cultures, whereas GH2, GH3, and GH43 were most frequently assigned to class <italic>Bacteroidia</italic> in poplar hydrolysate-fed cultures.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption><p>Phylogenetic distribution of CAZyme sequences assigned to the top 10 identified classes.</p></caption>
<graphic xlink:href="fmicb-08-02504-g001.tif"/>
</fig>
<p>Considering all plant polysaccharides-degrading CAZymes predicted in each metagenome, more than half were less than 60% identical to the CAZyme amino acid sequences reported in the CAZy database (<bold>Figure <xref ref-type="fig" rid="F2">2</xref></bold>). While percent identities varied depending on CAZyme family (Supplementary Figure <xref ref-type="supplementary-material" rid="SM1">S3</xref>), the most divergent sequences belong to families GH113 (on average 34% identical to their closest blast hits), PL22 (35%), GH5 (40%), GH74 (40%), and PL9 (43%).</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption><p>Percent identity between amino acid sequences in the CAZy database and CAZyme sequences predicted in beaver dropping (BD) and moose rumen (MR) microcosms enriched with cellulose (C) and poplar hydrolysate (PH). Percent identities correspond to best blast hits in the CAZy database, and were obtained for CAZyme sequences belonging to CAZyme families known to contain enzymes that act on plant cell wall carbohydrates (<bold>Figure <xref ref-type="fig" rid="F4">4A</xref></bold>).</p></caption>
<graphic xlink:href="fmicb-08-02504-g002.tif"/>
</fig>
<p>Hierarchical clustering analysis of plant polysaccharide-active CAZyme families distinguished those reported in this study from those previously predicted from grass-feeding mammals or mixed plants foragers (<bold>Figure <xref ref-type="fig" rid="F3">3A</xref></bold>). In particular, the distribution of the CAZyme families predicted in moose rumen enrichments differed from that recently reported for the moose rumen metagenome (<xref ref-type="bibr" rid="B57">Svartstr&#x00F6;m et al., 2017</xref>), where highest contributing factors were attributed to relatively high abundance of CE4, GH94, and GH78 families, and low abundance of GH2, GH43 in the moose rumen enrichments (Supplementary Table <xref ref-type="supplementary-material" rid="SM1">S3</xref>). Consistent with substrate-induced convergence (<xref ref-type="bibr" rid="B65">Wong et al., 2016</xref>), long-term <italic>ex situ</italic> enrichment prior to metagenome sequencing also led to higher similarity of CAZyme distributions for cultures fed with the same carbon source (i.e., poplar hydrolysate or cellulose) as opposed to originating from the same environmental source (i.e., moose rumen or beaver droppings) (<bold>Figure <xref ref-type="fig" rid="F3">3A</xref></bold>). The observed substrate-driven convergence of metagenomes was mostly attributed to higher relative abundances of GH2, GH3, GH43, CE1, CE4 in cultures enriched on poplar hydrolysate (Supplementary Table <xref ref-type="supplementary-material" rid="SM1">S3</xref>). At the same time, a greater overlap of unique CAZyme sequences was observed between cultures fed with the same substrate than those with the same inoculum (<bold>Figure <xref ref-type="fig" rid="F3">3B</xref></bold>). It is also worthwhile to note that the plant polysaccharide-active CAZyme families from termite gut, albeit wood-feeding, do not cluster closely with those from the poplar hydrolysate enrichments due to the latter&#x2019;s lower relative abundances of GH5, GH10, and GH94 (Supplementary Table <xref ref-type="supplementary-material" rid="SM1">S3</xref>). This likely reflects differences in the wood substrates consumed, as well as intrinsic differences in the gut microbiome of mammals and insects. Nonetheless, along PC2 where these metagenomes diverge the most, the PCA plot depicted a closer resemblance of CAZyme profiles microbiomes from termite gut and moose rumen samples enriched on poplar hydrolysate, than that between the former and the non-enriched moose rumen.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption><p><bold>(A)</bold> Correlation clustering and PCA plots of CAZyme profiles encoded by metagenomes from lignocellulose degrading microbial communities. CAZyme families known to contain enzymes that act on plant cell wall carbohydrates were considered in the analysis. Public datasets included cow (<xref ref-type="bibr" rid="B26">Hess et al., 2011</xref>), moose (<xref ref-type="bibr" rid="B57">Svartstr&#x00F6;m et al., 2017</xref>), panda (<xref ref-type="bibr" rid="B67">Zhu et al., 2011</xref>), reindeer (<xref ref-type="bibr" rid="B50">Pope et al., 2012</xref>), Saudi sheep (<xref ref-type="bibr" rid="B2">Al-Masaudi et al., 2017</xref>), termite (<xref ref-type="bibr" rid="B63">Warnecke et al., 2007</xref>), and wallaby (<xref ref-type="bibr" rid="B49">Pope et al., 2010</xref>). A 3D PCA plot is shown on the top right corner with the corresponding 2D PCA plots shown at the bottom; confidence intervals (95%) are indicated by the ellipses. <bold>(B)</bold> Venn diagram showing a greater overlap of unique CAZyme sequences in cultures fed with the same substrates (numbers underlined) than those that originate from the same inocula (numbers in italics).</p></caption>
<graphic xlink:href="fmicb-08-02504-g003.tif"/>
</fig>
</sec>
<sec><title>Impact of Enrichment Substrate on Profiles of Predicted Plant&#x2013;Polysaccharide Degrading CAZyme Sequences</title>
<p>Metagenomes of cultures enriched on poplar hydrolysate yielded a higher proportion of predicted plant polysaccharides-active CAZymes (&#x223C;33%) compared to metagenomes of cultures enriched on cellulose (&#x223C;23%) (<bold>Table <xref ref-type="table" rid="T1">1</xref></bold> and <bold>Figure <xref ref-type="fig" rid="F4">4A</xref></bold>). In particular, poplar hydrolysate-degrading communities were enriched in sequence counts from families GH3, GH5, GH43, CE1, and GH53 (<bold>Figure <xref ref-type="fig" rid="F4">4A</xref></bold>). Additional substrate-induced differences were noted when considering moose rumen and beaver dropping enrichments separately. Beaver dropping samples enriched on poplar hydrolysate encoded higher counts of GH2 (1.5 times higher) and GH106 (4.6 times) than corresponding samples enriched on cellulose (<bold>Figure <xref ref-type="fig" rid="F4">4B</xref></bold>). Meanwhile, moose rumen samples enriched on poplar hydrolysate encoded higher counts of GH9 (2 times higher), CE4 (1.8 times), GH127 (9 times), and CE15 (11 times) compared to corresponding samples enriched on cellulose (<bold>Figure <xref ref-type="fig" rid="F4">4B</xref></bold>).</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption><p><bold>(A)</bold> Distribution of plant (poly)saccharide degrading-CAZyme families as single and multi-modular domains. <bold>(B)</bold> Normalized count and fold difference of CAZyme families predicted to act on plant polysaccharides between poplar hydrolysate (PH)- and cellulose (C)-fed beaver dropping (BD) and moose rumen (MR) cultures. Fold difference was only calculated for non-zero counts.</p></caption>
<graphic xlink:href="fmicb-08-02504-g004.tif"/>
</fig>
<p>Carbohydrate-active enzymes families that were enriched through growth on poplar hydrolysate included those that comprise enzymes involved in plant polysaccharide deconstruction. For example, family GH43 includes enzymes that target arabinoxylan (<xref ref-type="bibr" rid="B14">Borsenberger et al., 2014</xref>; <xref ref-type="bibr" rid="B41">Mewis et al., 2016</xref>), family CE1 members were shown to deacetylate polymeric xylans (<xref ref-type="bibr" rid="B44">Neumuller et al., 2015</xref>; <xref ref-type="bibr" rid="B37">Mai-Gisondi et al., 2017</xref>), and family GH5 members include endoxylanases that targets xylans with or without methyl-glucuronic acid side chain (<xref ref-type="bibr" rid="B22">Gallardo et al., 2010</xref>), as well as enzymes that target cellulose and mannans (<xref ref-type="bibr" rid="B6">Aspeborg et al., 2012</xref>). Notably, enzymes belonging to families GH2 and GH3 were also abundant in the moose rumen microbiome, and predicted to participate in plant cell wall deconstruction (<xref ref-type="bibr" rid="B57">Svartstr&#x00F6;m et al., 2017</xref>). Characterized CE15 members display 4-<italic>O</italic>-methyl-glucuronoyl methylesterase activity, which are thought to hydrolyze ester linkages that may form between hydroxyl groups in lignin and 4-<italic>O</italic>-methyl-<sc>D</sc>-glucuronic acid residues in glucuronoxylans that dominate in hardwood fiber (<xref ref-type="bibr" rid="B11">Biely et al., 2015</xref>; <xref ref-type="bibr" rid="B10">Biely, 2016</xref>). Recently, a marine bacterial CE15 enzyme predicted to act on alginates was also reported, suggesting a broader substrate range for this CE family (<xref ref-type="bibr" rid="B17">De Santi et al., 2016</xref>; <xref ref-type="bibr" rid="B1">Agger et al., 2017</xref>). On the other hand, GH127 enzymes typically contain &#x03B2;-<sc>L</sc>-arabinofuranosidases that have been shown to target plant cell wall glycoproteins, such as extensin (<xref ref-type="bibr" rid="B21">Fujita et al., 2011</xref>). By contrast, between 3 and 13 times more GH74 sequences were identified in cellulose-fed enrichments compared to corresponding cultures enriched on poplar hydrolysate, fitting with the endoglucanase activity reported for this CAZyme family (<xref ref-type="bibr" rid="B56">Song et al., 2017</xref>). Similarly, 4.6 times more GH1 sequences were identified in the beaver dropping culture enriched on cellulose than that on poplar hydrolysate; characterized bacteria members from this family large act as &#x03B2;-glucosidases that hydrolyze cellobiose and soluble cellodextrins to glucose (<xref ref-type="bibr" rid="B54">Singhania et al., 2013</xref>). Interestingly, families capable of pectin degradation (PL1, PL9) were also found at higher abundances in the cellulose-fed beaver dropping culture than that fed with poplar hydrolysate.</p>
<p>Carbohydrate-binding modules can impact enzyme performance through targeting catalytic modules to polysaccharide substrates, and in some cases promote non-hydrolytic fiber disruption (<xref ref-type="bibr" rid="B13">Boraston et al., 2004</xref>; <xref ref-type="bibr" rid="B23">Gourlay et al., 2012</xref>); accordingly, CAZymes with cognate CBMs were also predicted from each metagenome sequence. About 20% of the sequences predicted to encode plant polysaccharides degrading enzymes (i.e., 669 sequences) were predicted to form multi-domain proteins (Supplementary Table <xref ref-type="supplementary-material" rid="SM1">S4</xref>). Most frequent domain organizations included CBMs, such as CBM48-GH13_9 (7&#x2013;8% in cellulose enrichments), GH9-CBM3-CBM3 (&#x223C;6% in moose rumen samples enriched on poplar hydrolysate), and CBM50-CBM50-GH18 (&#x223C;6% in beaver dropping and moose rumen samples enriched on poplar hydrolysate and cellulose, respectively). While CBM48-GH13 is a documented architecture for starch-degrading enzymes (<xref ref-type="bibr" rid="B36">Machovic and Janecek, 2008</xref>), the modular architecture GH9-CBM3-CBM3 was previously only reported as a non-cellulosomal enzyme encoded by <italic>Clostridium thermocellum</italic> (<xref ref-type="bibr" rid="B3">Anitori, 2012</xref>). CBM50-CBM50-GH18, like other GH18 chitinases with multiple CBM50 domains, was predicted to bind peptidoglycan-like and chitin-derived oligosaccharides (<xref ref-type="bibr" rid="B8">Bateman and Bycroft, 2000</xref>). Contrary to findings recently reported for the moose rumen microbiome (<xref ref-type="bibr" rid="B57">Svartstr&#x00F6;m et al., 2017</xref>), the multi-modular enzymes comprising CBM50 and GH23 or GH73 were identified at low abundance (&#x003C;3.5%) in the enriched moose rumen metagenomes reported herein.</p>
<p>In addition to multi-modular CAZymes comprising CBMs, those comprising potential cellulosomal subunits were also predicted. Cellulosomes are cell-associated multi-enzyme complexes that are produced by certain anaerobic bacteria to promote polysaccharide degradation (<xref ref-type="bibr" rid="B64">White et al., 2014</xref>; <xref ref-type="bibr" rid="B4">Artzi et al., 2017</xref>; <xref ref-type="bibr" rid="B55">Smith et al., 2017</xref>). When expressed as cell-bound cellulosomes (opposed to cell-free cellulosomes), the primary scaffoldins are connected through type II dockerin-cohesin interactions to specialized anchoring scaffoldins, which contain peptidoglycan-binding S-layer homology modules that anchor to the cell surface. Type I interactions, on the other hand, occur between the dockerin-containing enzymatic subunits and the cohesins on the primary scaffoldins.</p>
<p>For all enrichments, approximately twice the number of dockerins compared to cohesins were predicted (<bold>Table <xref ref-type="table" rid="T1">1</xref></bold>), and 56% of dockerins were appended to CAZyme sequences (Supplementary Table <xref ref-type="supplementary-material" rid="SM1">S5</xref>). The most frequently occurring CAZyme module was family GH9 (&#x223C;29%), followed by GH5 (&#x223C;11%), CE3 (&#x223C;8%), GH43 (&#x223C;7%), and GH3 (&#x223C;6%) (<bold>Figure <xref ref-type="fig" rid="F5">5</xref></bold> and Supplementary Table <xref ref-type="supplementary-material" rid="SM1">S4</xref>). And unlike the recent study of the moose rumen metagenome, the recurrent GH13 appended-dockerins (<xref ref-type="bibr" rid="B57">Svartstr&#x00F6;m et al., 2017</xref>) were not identified in the current moose rumen metagenomes, likely due to their long enrichment on cellulosic carbon sources. Other common components of cellulosome systems (<xref ref-type="bibr" rid="B4">Artzi et al., 2017</xref>), such as GH10 (&#x223C;4%), GH11 (&#x223C;4%), and GH48 (&#x223C;4%) were also identified in the metagenomes of both moose rumen and beaver dropping enrichments, albeit at a lower abundance. Notably, the identification of few sequences containing a GH48 module and the approximately nine-fold higher number of those containing a GH9 module is consistent with the earlier analyses of cellulose-degrading anaerobic bacteria that generate high levels of a single GH48 and diverse GH9 enzymes with potential synergistic action (<xref ref-type="bibr" rid="B42">Morag et al., 1991</xref>; <xref ref-type="bibr" rid="B51">Ravachol et al., 2014</xref>; <xref ref-type="bibr" rid="B5">Artzi et al., 2015</xref>).</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption><p>Catalog of domain architectures of top 11 abundant CAZy-dockerins in the cellulose- and poplar hydrolysate-fed microbial enrichments from beaver droppings and moose rumen. CBM, carbohydrate-binding module; CE, carbohydrate esterase; DOC1, type 1 dockerin; GH, glycoside hydrolases; PL, polysaccharide lyase.</p></caption>
<graphic xlink:href="fmicb-08-02504-g005.tif"/>
</fig>
</sec>
<sec><title>Predicted Polysaccharide Utilization Loci (PULs)</title>
<p>As summarized above, PULs have emerged as especially fruitful regions within genomic sequences for enzyme discovery (<xref ref-type="bibr" rid="B34">Larsbrink et al., 2016</xref>). Herein, 416 PULs were predicted (Supplementary Figure <xref ref-type="supplementary-material" rid="SM1">S4</xref>), where the normalized number predicted from poplar hydrolysate-fed microcosms of beaver droppings was 4.5 times that predicted from cellulose-fed microcosms. Consistent with the overall distribution of predicted CAZyme sequences, those belonging to families CE1, GH3, and GH43, were most frequently identified in the predicted PULs (<bold>Figure <xref ref-type="fig" rid="F6">6A</xref></bold> and Supplementary Table <xref ref-type="supplementary-material" rid="SM1">S6</xref>). Moreover, PULs comprising members of families GH127 and GH9 were exclusively identified in metagenomes from cultures enriched on poplar hydrolysate. Based on the family composition of a given PUL, substrate category of the PUL-encoded enzymes can be inferred. For example, <bold>Figure <xref ref-type="fig" rid="F6">6B</xref></bold> illustrates PULs that potentially target xylan and pectin based on the established activities of the CAZyme families. Sequences annotated as unknown may include novel enzyme functions, for instance as shown recently in the case of the type II rhamnogalacturonan PUL of <italic>B. thetaiotaomicron</italic> (<xref ref-type="bibr" rid="B43">Ndeh et al., 2017</xref>).</p>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption><p><bold>(A)</bold> Top 15 most abundant CAZyme families identified in predicted PULs from cellulose (C)- and poplar hydrolysate (PH)-fed microbial enrichments of beaver droppings and moose rumen. <bold>(B)</bold> Examples of predicted PULs from beaver droppings enriched on poplar hydrolysate (BD-PH). <bold>(C)</bold> Similarity-based clustering (&#x2265;70%) of proteins with unknown function positioned in PULs identified herein and listed in the public PUL database (<ext-link ext-link-type="uri" xlink:href="http://www.cazy.org/PULDB/">http://www.cazy.org/PULDB/</ext-link>). Each cluster contains a central node that denotes the representative protein with unknown function (defined by the longest length) and connected nodes that represent a protein with unknown function that is &#x2265;70% identical to the representative sequence (see the section &#x201C;Materials and Methods&#x201D;). PUL identifiers are shown on each node; the thickness of the edges correlates to percent identity between sequences. Circled in red and blue are proteins with unknown functions that are &#x2265;95% identical to one another; the architecture of PULs circled in red is identical, whereas those circled in blue share a common central architecture but differ at flanking regions. Circled in purple is the only cluster that comprises proteins with unknown function from both PULs predicted herein and those from the public PUL database.</p></caption>
<graphic xlink:href="fmicb-08-02504-g006.tif"/>
</fig>
<p>Of note, 620 sequences annotated as proteins with unknown function (with lengths ranging from 32 to 1,320 amino acids) were identified in all candidate PULs (Supplementary Figure <xref ref-type="supplementary-material" rid="SM1">S5A</xref>). Among these, eight sequences annotated as proteins with unknown function were found to comprise a CBM from family CBM32, CBM35, CBM51, or CBM66. In an effort to prioritize additional sequences for future characterization, a clustering network diagram was generated to uncover protein sequences with unknown function that reoccurred in the predicted PULs. However, little similarity was revealed between such sequences from PULs predicted herein and those reported in the public PULDB (Supplementary Figure <xref ref-type="supplementary-material" rid="SM1">S5B</xref>). In fact, only one such sequence from beaver droppings enriched on poplar hydrolysate was &#x2265;70% identical to those annotated in the PULDB, and the few sequences with unknown function that did cluster typically originated from PULs with similar architecture (<bold>Figure <xref ref-type="fig" rid="F6">6C</xref></bold> and Supplementary Figure <xref ref-type="supplementary-material" rid="SM1">S4</xref>).</p>
</sec>
<sec><title>Predicted Multi-Modular Proteins &#x2013; An Additional Source of Yet Unknown Carbohydrate-Active Proteins</title>
<p>A second approach to assist the discovery of potentially new CAZyme families considered multi-modular proteins predicted to comprise a DUF, or a sequence of unknown function, appended to a CBM or dockerins (cellulosomal subunit).</p>
<p>Considering all four metagenome sequences reported herein, 62 DUFs were identified that co-occurred with a CBM (<bold>Figure <xref ref-type="fig" rid="F7">7</xref></bold> and Supplementary Figure <xref ref-type="supplementary-material" rid="SM1">S6</xref>). The most frequent organizations were: DUF3794-CBM50 (10 identified), DUF362-CBM9-DOC1 (4 identified), DUF4366-CBM16 (4 identified), which were identified in all four metagenomes; five DUF3459-CBM48-GH13_10 sequences were also identified in the metagenome of beaver droppings enriched on poplar hydrolysate (Supplementary Figure <xref ref-type="supplementary-material" rid="SM1">S6</xref>). As shown herein and also described in the Pfam database (<xref ref-type="bibr" rid="B20">Finn et al., 2016</xref>), DUF3794 was often found in association with CBM50. On the other hand, DUF362 is often present in proteins with domains that bind to iron&#x2013;sulfur clusters, and its coexistence with CBM9_1 in an uncharacterized protein from soil bacteria <italic>Sorangium cellulosum</italic> was previously observed (UniProt entry S4XJL8). The structure of DUF3459 has been determined (UniProt entries B2IUW9, Q9RX51, Q8ZPF0, Q8P5I2, Q2PS28, M1E1F6, M1E1F3, H3K096), and as observed here, was previously shown to be part of multi-modular proteins comprising GH13 and CBM48 domains (UniProt entries W6LS46, R4KHQ4, C7RTS8). Although not frequently observed, one PUL identified in the poplar hydrolysate-fed beaver droppings culture contained DUF5005 appended to a predicted CBM32 (<bold>Figure <xref ref-type="fig" rid="F6">6B</xref></bold>).</p>
<fig id="F7" position="float">
<label>FIGURE 7</label>
<caption><p>Carbohydrate-active proteins with domains of unknown functions (DUFs) identified in the metagenomes. In bold are the DUFs that are identified with various CBMs and CAZymes as shown via the connections color-coded in accordance to the DUFs. The number and corresponding percentage of each combination of modules are shown in the outer scale.</p></caption>
<graphic xlink:href="fmicb-08-02504-g007.tif"/>
</fig>
<p>Of the predicted dockerin sequences, 44% lacked known appended CAZyme modules. Similar to previous reports (<xref ref-type="bibr" rid="B20">Finn et al., 2016</xref>), a few dockerin sequences were predicted to have appended DUF (i.e., DUF362, DUF1533, and DUF3237); however, the majority were not annotated as containing modules or domains functionally attributed to cellulosomes. In many cases, this could reflect sequence gaps due to incomplete metagenome assembly; however, it is also conceivable that dockerin&#x2013;cohesin proteins might in fact participate in other biological functions, as suggested by a phylogenetically distinct group of cohesins discovered in the cow rumen metagenome (<xref ref-type="bibr" rid="B9">Bensoussan et al., 2017</xref>).</p>
</sec>
</sec>
<sec><title>Conclusion</title>
<p>Given their natural dietary habits, the Canadian beaver and North American moose have likely evolved digestive microbiomes with the ability to degrade diverse wood polysaccharides. To identify enzymes that may be most relevant to wood fiber bioprocessing, corresponding microbial communities were enriched for approximately 3 years on comparatively complex (poplar hydrolysate) and defined (microcrystalline cellulose) carbon sources. Enrichment led to substrate-induced convergence of CAZyme profiles, which significantly narrowed the number of CAZyme families and corresponding members that could be targeted and tested for improved enzymatic conversion of wood fiber. For example, in addition to families GH2, GH3, GH5, and GH43 which previous reports have also identified, GH127 and CE15 may be especially relevant for the anaerobic conversion of pretreated wood fiber. Protein sequences containing both a CBM and a DUF, as well as proteins with unknown function yet having signals for secretion and position within PULs, were also identified and may facilitate the discovery of new CAZyme activities. Proteomic analysis of secretomes from the enrichment cultures prepared herein will provide an additional filter for protein selection and characterization. In the interim, however, enrichment followed by comparative metagenomics sufficiently narrowed protein lists of primary interest, enabling direct recombinant production and characterization.</p>
</sec>
<sec><title>Author Contributions</title>
<p>MW performed the sequence analyses, data interpretation, and compiled the manuscript. WW maintained the enrichment cultures, prepared DNA samples for sequencing, and contributed to data interpretation. MC and FR contributed to data interpretation. BH, NT, VL, and PL contributed to the search and annotation of CAZyme modules and PULs, as well as data interpretation. EM and EE conceived and coordinated the study. All authors contributed to the revision of manuscript and approved the final version.</p>
</sec>
<sec><title>Conflict of Interest Statement</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
</body>
<back>
<fn-group>
<fn fn-type="financial-disclosure">
<p><bold>Funding.</bold> This work was funded by the Government of Ontario for the project &#x201C;Forest FAB: Applied Genomics for Functionalized Fibre and Biochemicals&#x201D; (ORF-RE-05-005), the Natural Sciences and Engineering Research Council of Canada for the Strategic Network Grant &#x201C;Industrial Biocatalysis Network,&#x201D; the European Research Council (ERC) Grant Agreement 322820 to BH and an ERC Consolidator Grant to EM (BHIVE &#x2013; 648925). MW was funded by a University of Toronto Fellowship and Professor William F. Graydon Memorial Graduate Fellowship. MC was funded by a Marie Curie International Outgoing Fellowship within the 7th European Community Framework Program.</p></fn>
</fn-group>
<ack>
<p>The authors would like to thank C. Washer and O. Molenda for training on using the Trimmomatic and AbySS assembly programs, and also W. Gao and D. Robson for IT support.</p>
</ack>
<sec sec-type="supplementary material">
<title>Supplementary Material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fmicb.2017.02504/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fmicb.2017.02504/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Presentation_1.pdf" id="SM1" mimetype="application/pdf" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Agger</surname> <given-names>J. W.</given-names></name> <name><surname>Busk</surname> <given-names>P. K.</given-names></name> <name><surname>Pilgaard</surname> <given-names>B.</given-names></name> <name><surname>Meyer</surname> <given-names>A. S.</given-names></name> <name><surname>Lange</surname> <given-names>L.</given-names></name></person-group> (<year>2017</year>). <article-title>A new functional classification of glucuronoyl esterases by peptide pattern recognition.</article-title> <source><italic>Front. Microbiol.</italic></source> <volume>8</volume>:<issue>309</issue>. <pub-id pub-id-type="doi">10.3389/fmicb.2017.00309</pub-id> <pub-id pub-id-type="pmid">28293230</pub-id></citation></ref>
<ref id="B2"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Al-Masaudi</surname> <given-names>S.</given-names></name> <name><surname>El Kaoutari</surname> <given-names>A.</given-names></name> <name><surname>Drula</surname> <given-names>E.</given-names></name> <name><surname>Al-Mehdar</surname> <given-names>H.</given-names></name> <name><surname>Redwan</surname> <given-names>E. M.</given-names></name> <name><surname>Lombard</surname> <given-names>V.</given-names></name><etal/></person-group> (<year>2017</year>). <article-title>A metagenomics investigation of carbohydrate-active enzymes along the gastrointestinal tract of Saudi sheep.</article-title> <source><italic>Front. Microbiol.</italic></source> <volume>8</volume>:<issue>666</issue>. <pub-id pub-id-type="doi">10.3389/fmicb.2017.00666</pub-id> <pub-id pub-id-type="pmid">28473812</pub-id></citation></ref>
<ref id="B3"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Anitori</surname> <given-names>R. P.</given-names></name></person-group> (<year>2012</year>). <source><italic>Extremophiles: Microbiology and Biotechnology</italic>.</source> <publisher-loc>Poole</publisher-loc>: <publisher-name>Caister Academic Press</publisher-name>.</citation></ref>
<ref id="B4"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Artzi</surname> <given-names>L.</given-names></name> <name><surname>Bayer</surname> <given-names>E. A.</given-names></name> <name><surname>Morais</surname> <given-names>S.</given-names></name></person-group> (<year>2017</year>). <article-title>Cellulosomes: bacterial nanomachines for dismantling plant polysaccharides.</article-title> <source><italic>Nat. Rev. Microbiol.</italic></source> <volume>15</volume> <fpage>83</fpage>&#x2013;<lpage>95</lpage>. <pub-id pub-id-type="doi">10.1038/nrmicro.2016.164</pub-id> <pub-id pub-id-type="pmid">27941816</pub-id></citation></ref>
<ref id="B5"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Artzi</surname> <given-names>L.</given-names></name> <name><surname>Morag</surname> <given-names>E.</given-names></name> <name><surname>Barak</surname> <given-names>Y.</given-names></name> <name><surname>Lamed</surname> <given-names>R.</given-names></name> <name><surname>Bayer</surname> <given-names>E. A.</given-names></name></person-group> (<year>2015</year>). <article-title><italic>Clostridium clariflavum</italic>: key cellulosome players are revealed by proteomic analysis.</article-title> <source><italic>mBio</italic></source> <volume>6</volume>:<issue>e00411-15</issue>. <pub-id pub-id-type="doi">10.1128/mBio.00411-15</pub-id> <pub-id pub-id-type="pmid">25991683</pub-id></citation></ref>
<ref id="B6"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Aspeborg</surname> <given-names>H.</given-names></name> <name><surname>Coutinho</surname> <given-names>P. M.</given-names></name> <name><surname>Wang</surname> <given-names>Y.</given-names></name> <name><surname>Brumer</surname> <given-names>H.</given-names></name> <name><surname>Henrissat</surname> <given-names>B.</given-names></name></person-group> (<year>2012</year>). <article-title>Evolution, substrate specificity and subfamily classification of glycoside hydrolase family 5 (GH5).</article-title> <source><italic>BMC Evol. Biol.</italic></source> <volume>12</volume>:<issue>186</issue>. <pub-id pub-id-type="doi">10.1186/1471-2148-12-186</pub-id> <pub-id pub-id-type="pmid">22992189</pub-id></citation></ref>
<ref id="B7"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bagenholm</surname> <given-names>V.</given-names></name> <name><surname>Reddy</surname> <given-names>S. K.</given-names></name> <name><surname>Bouraoui</surname> <given-names>H.</given-names></name> <name><surname>Morrill</surname> <given-names>J.</given-names></name> <name><surname>Kulcinskaja</surname> <given-names>E.</given-names></name> <name><surname>Bahr</surname> <given-names>C. M.</given-names></name><etal/></person-group> (<year>2017</year>). <article-title>Galactomannan catabolism conferred by a polysaccharide utilization locus of <italic>Bacteroides ovatus</italic>- enzyme synergy and crystal structure of a beta-mannanase.</article-title> <source><italic>J. Biol. Chem.</italic></source> <volume>292</volume> <fpage>229</fpage>&#x2013;<lpage>243</lpage>. <pub-id pub-id-type="doi">10.1074/jbc.M116.746438</pub-id> <pub-id pub-id-type="pmid">27872187</pub-id></citation></ref>
<ref id="B8"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bateman</surname> <given-names>A.</given-names></name> <name><surname>Bycroft</surname> <given-names>M.</given-names></name></person-group> (<year>2000</year>). <article-title>The structure of a LysM domain from <italic>E. coli</italic> membrane-bound lytic murein transglycosylase D (MltD).</article-title> <source><italic>J. Mol. Biol.</italic></source> <volume>299</volume> <fpage>1113</fpage>&#x2013;<lpage>1119</lpage>. <pub-id pub-id-type="doi">10.1006/jmbi.2000.3778</pub-id> <pub-id pub-id-type="pmid">10843862</pub-id></citation></ref>
<ref id="B9"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bensoussan</surname> <given-names>L.</given-names></name> <name><surname>Morais</surname> <given-names>S.</given-names></name> <name><surname>Dassa</surname> <given-names>B.</given-names></name> <name><surname>Friedman</surname> <given-names>N.</given-names></name> <name><surname>Henrissat</surname> <given-names>B.</given-names></name> <name><surname>Lombard</surname> <given-names>V.</given-names></name><etal/></person-group> (<year>2017</year>). <article-title>Broad phylogeny and functionality of cellulosomal components in the bovine rumen microbiome.</article-title> <source><italic>Environ. Microbiol.</italic></source> <volume>19</volume> <fpage>185</fpage>&#x2013;<lpage>197</lpage>. <pub-id pub-id-type="doi">10.1111/1462-2920.13561</pub-id> <pub-id pub-id-type="pmid">27712009</pub-id></citation></ref>
<ref id="B10"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Biely</surname> <given-names>P.</given-names></name></person-group> (<year>2016</year>). <article-title>Microbial glucuronoyl esterases: 10 years after discovery.</article-title> <source><italic>Appl. Environ. Microbiol.</italic></source> <volume>82</volume> <fpage>7014</fpage>&#x2013;<lpage>7018</lpage>. <pub-id pub-id-type="doi">10.1128/AEM.02396-16</pub-id> <pub-id pub-id-type="pmid">27694239</pub-id></citation></ref>
<ref id="B11"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Biely</surname> <given-names>P.</given-names></name> <name><surname>Malovikova</surname> <given-names>A.</given-names></name> <name><surname>Uhliarikova</surname> <given-names>I.</given-names></name> <name><surname>Li</surname> <given-names>X. L.</given-names></name> <name><surname>Wong</surname> <given-names>D. W. S.</given-names></name></person-group> (<year>2015</year>). <article-title>Glucuronoyl esterases are active on the polymeric substrate methyl esterified glucuronoxylan.</article-title> <source><italic>FEBS Lett.</italic></source> <volume>589</volume> <fpage>2334</fpage>&#x2013;<lpage>2339</lpage>. <pub-id pub-id-type="doi">10.1016/j.febslet.2015.07.019</pub-id> <pub-id pub-id-type="pmid">26216754</pub-id></citation></ref>
<ref id="B12"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bolger</surname> <given-names>A. M.</given-names></name> <name><surname>Lohse</surname> <given-names>M.</given-names></name> <name><surname>Usadel</surname> <given-names>B.</given-names></name></person-group> (<year>2014</year>). <article-title>Trimmomatic: a flexible trimmer for Illumina sequence data.</article-title> <source><italic>Bioinformatics</italic></source> <volume>30</volume> <fpage>2114</fpage>&#x2013;<lpage>2120</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btu170</pub-id> <pub-id pub-id-type="pmid">24695404</pub-id></citation></ref>
<ref id="B13"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Boraston</surname> <given-names>A. B.</given-names></name> <name><surname>Bolam</surname> <given-names>D. N.</given-names></name> <name><surname>Gilbert</surname> <given-names>H. J.</given-names></name> <name><surname>Davies</surname> <given-names>G. J.</given-names></name></person-group> (<year>2004</year>). <article-title>Carbohydrate-binding modules: fine-tuning polysaccharide recognition.</article-title> <source><italic>Biochem. J.</italic></source> <volume>382</volume> <fpage>769</fpage>&#x2013;<lpage>781</lpage>. <pub-id pub-id-type="doi">10.1042/BJ20040892</pub-id> <pub-id pub-id-type="pmid">15214846</pub-id></citation></ref>
<ref id="B14"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Borsenberger</surname> <given-names>V.</given-names></name> <name><surname>Dornez</surname> <given-names>E.</given-names></name> <name><surname>Desrousseaux</surname> <given-names>M. L.</given-names></name> <name><surname>Massou</surname> <given-names>S.</given-names></name> <name><surname>Tenkanen</surname> <given-names>M.</given-names></name> <name><surname>Courtin</surname> <given-names>C. M.</given-names></name><etal/></person-group> (<year>2014</year>). <article-title>A H-1 NMR study of the specificity of alpha-L-arabinofuranosidases on natural and unnatural substrates.</article-title> <source><italic>Biochim. Biophys. Acta</italic></source> <volume>1840</volume> <fpage>3106</fpage>&#x2013;<lpage>3114</lpage>. <pub-id pub-id-type="doi">10.1016/j.bbagen.2014.07.001</pub-id> <pub-id pub-id-type="pmid">25016078</pub-id></citation></ref>
<ref id="B15"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chaney</surname> <given-names>W. R.</given-names></name></person-group> (<year>2003</year>). <source><italic>Why Do Animals Eat the Bark and Wood of Trees and Shrubs?</italic></source> <comment>Available at: <ext-link ext-link-type="uri" xlink:href="https://www.extension.purdue.edu/extmedia/fnr/fnr_203.pdf">https://www.extension.purdue.edu/extmedia/fnr/fnr_203.pdf</ext-link> [accessed October 8, 2017]</comment>.</citation></ref>
<ref id="B16"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Damon</surname> <given-names>C.</given-names></name> <name><surname>Lehembre</surname> <given-names>F.</given-names></name> <name><surname>Oger-Desfeux</surname> <given-names>C.</given-names></name> <name><surname>Luis</surname> <given-names>P.</given-names></name> <name><surname>Ranger</surname> <given-names>J.</given-names></name> <name><surname>Fraissinet-Tachet</surname> <given-names>L.</given-names></name><etal/></person-group> (<year>2012</year>). <article-title>Metatranscriptomics reveals the diversity of genes expressed by eukaryotes in forest soils.</article-title> <source><italic>PLOS ONE</italic></source> <volume>7</volume>:<issue>e28967</issue>. <pub-id pub-id-type="doi">10.1371/journal.pone.0028967</pub-id> <pub-id pub-id-type="pmid">22238585</pub-id></citation></ref>
<ref id="B17"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>De Santi</surname> <given-names>C.</given-names></name> <name><surname>Willassen</surname> <given-names>N. P.</given-names></name> <name><surname>Williamson</surname> <given-names>A.</given-names></name></person-group> (<year>2016</year>). <article-title>Biochemical characterization of a family 15 carbohydrate esterase from a bacterial marine arctic metagenome.</article-title> <source><italic>PLOS ONE</italic></source> <volume>11</volume>:<issue>e0159345</issue>. <pub-id pub-id-type="doi">10.1371/journal.pone.0159345</pub-id> <pub-id pub-id-type="pmid">27433797</pub-id></citation></ref>
<ref id="B18"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>DeAngelis</surname> <given-names>K. M.</given-names></name> <name><surname>Silver</surname> <given-names>W. L.</given-names></name> <name><surname>Thompson</surname> <given-names>A. W.</given-names></name> <name><surname>Firestone</surname> <given-names>M. K.</given-names></name></person-group> (<year>2010</year>). <article-title>Microbial communities acclimate to recurring changes in soil redox potential status.</article-title> <source><italic>Environ. Microbiol.</italic></source> <volume>12</volume> <fpage>3137</fpage>&#x2013;<lpage>3149</lpage>. <pub-id pub-id-type="doi">10.1111/j.1462-2920.2010.02286.x</pub-id> <pub-id pub-id-type="pmid">20629704</pub-id></citation></ref>
<ref id="B19"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Excoffier</surname> <given-names>G.</given-names></name> <name><surname>Toussaint</surname> <given-names>B.</given-names></name> <name><surname>Vignon</surname> <given-names>M. R.</given-names></name></person-group> (<year>1991</year>). <article-title>Saccharification of steam-exploded poplar wood.</article-title> <source><italic>Biotechnol. Bioeng.</italic></source> <volume>38</volume> <fpage>1308</fpage>&#x2013;<lpage>1317</lpage>. <pub-id pub-id-type="doi">10.1002/bit.260381108</pub-id> <pub-id pub-id-type="pmid">18600732</pub-id></citation></ref>
<ref id="B20"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Finn</surname> <given-names>R. D.</given-names></name> <name><surname>Coggill</surname> <given-names>P.</given-names></name> <name><surname>Eberhardt</surname> <given-names>R. Y.</given-names></name> <name><surname>Eddy</surname> <given-names>S. R.</given-names></name> <name><surname>Mistry</surname> <given-names>J.</given-names></name> <name><surname>Mitchell</surname> <given-names>A. L.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>The Pfam protein families database: towards a more sustainable future.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>44</volume> <fpage>D279</fpage>&#x2013;<lpage>D285</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkv1344</pub-id> <pub-id pub-id-type="pmid">26673716</pub-id></citation></ref>
<ref id="B21"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Fujita</surname> <given-names>K.</given-names></name> <name><surname>Sakamoto</surname> <given-names>S.</given-names></name> <name><surname>Ono</surname> <given-names>Y.</given-names></name> <name><surname>Wakao</surname> <given-names>M.</given-names></name> <name><surname>Suda</surname> <given-names>Y.</given-names></name> <name><surname>Kitahara</surname> <given-names>K.</given-names></name><etal/></person-group> (<year>2011</year>). <article-title>Molecular cloning and characterization of a beta-l-arabinobiosidase in <italic>Bifidobacterium longum</italic> that belongs to a novel glycoside hydrolase family.</article-title> <source><italic>J. Biol. Chem.</italic></source> <volume>286</volume> <fpage>5143</fpage>&#x2013;<lpage>5150</lpage>. <pub-id pub-id-type="doi">10.1074/jbc.M110.190512</pub-id> <pub-id pub-id-type="pmid">21149454</pub-id></citation></ref>
<ref id="B22"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gallardo</surname> <given-names>O.</given-names></name> <name><surname>Fernandez-Fernandez</surname> <given-names>M.</given-names></name> <name><surname>Valls</surname> <given-names>C.</given-names></name> <name><surname>Valenzuela</surname> <given-names>S. V.</given-names></name> <name><surname>Roncero</surname> <given-names>M. B.</given-names></name> <name><surname>Vidal</surname> <given-names>T.</given-names></name><etal/></person-group> (<year>2010</year>). <article-title>Characterization of a family GH5 xylanase with activity on neutral oligosaccharides and evaluation as a pulp bleaching aid.</article-title> <source><italic>Appl. Environ. Microbiol.</italic></source> <volume>76</volume> <fpage>6290</fpage>&#x2013;<lpage>6294</lpage>. <pub-id pub-id-type="doi">10.1128/AEM.00871-10</pub-id> <pub-id pub-id-type="pmid">20656870</pub-id></citation></ref>
<ref id="B23"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gourlay</surname> <given-names>K.</given-names></name> <name><surname>Arantes</surname> <given-names>V.</given-names></name> <name><surname>Saddler</surname> <given-names>J. N.</given-names></name></person-group> (<year>2012</year>). <article-title>Use of substructure-specific carbohydrate binding modules to track changes in cellulose accessibility and surface morphology during the amorphogenesis step of enzymatic hydrolysis.</article-title> <source><italic>Biotechnol. Biofuels</italic></source> <volume>5</volume>:<issue>51</issue>. <pub-id pub-id-type="doi">10.1186/1754-6834-5-51</pub-id> <pub-id pub-id-type="pmid">22828270</pub-id></citation></ref>
<ref id="B24"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>He</surname> <given-names>S. M.</given-names></name> <name><surname>Ivanova</surname> <given-names>N.</given-names></name> <name><surname>Kirton</surname> <given-names>E.</given-names></name> <name><surname>Allgaier</surname> <given-names>M.</given-names></name> <name><surname>Bergin</surname> <given-names>C.</given-names></name> <name><surname>Scheffrahn</surname> <given-names>R. H.</given-names></name><etal/></person-group> (<year>2013</year>). <article-title>Comparative metagenomic and metatranscriptomic analysis of hindgut paunch microbiota in wood- and dung-feeding higher termites.</article-title> <source><italic>PLOS ONE</italic></source> <volume>8</volume>:<issue>e61126</issue>. <pub-id pub-id-type="doi">10.1371/journal.pone.0061126</pub-id> <pub-id pub-id-type="pmid">23593407</pub-id></citation></ref>
<ref id="B25"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Heiss-Blanquet</surname> <given-names>S.</given-names></name> <name><surname>Fayolle-Guichard</surname> <given-names>F.</given-names></name> <name><surname>Lombard</surname> <given-names>V.</given-names></name> <name><surname>Hebert</surname> <given-names>A.</given-names></name> <name><surname>Coutinho</surname> <given-names>P. M.</given-names></name> <name><surname>Groppi</surname> <given-names>A.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>Composting-like conditions are more efficient for enrichment and diversity of organisms containing cellulase-encoding genes than submerged cultures.</article-title> <source><italic>PLOS ONE</italic></source> <volume>11</volume>:<issue>e0167216</issue>. <pub-id pub-id-type="doi">10.1371/journal.pone.0167216</pub-id> <pub-id pub-id-type="pmid">27936240</pub-id></citation></ref>
<ref id="B26"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hess</surname> <given-names>M.</given-names></name> <name><surname>Sczyrba</surname> <given-names>A.</given-names></name> <name><surname>Egan</surname> <given-names>R.</given-names></name> <name><surname>Kim</surname> <given-names>T. W.</given-names></name> <name><surname>Chokhawala</surname> <given-names>H.</given-names></name> <name><surname>Schroth</surname> <given-names>G.</given-names></name><etal/></person-group> (<year>2011</year>). <article-title>Metagenomic discovery of biomass-degrading genes and genomes from cow rumen.</article-title> <source><italic>Science</italic></source> <volume>331</volume> <fpage>463</fpage>&#x2013;<lpage>467</lpage>. <pub-id pub-id-type="doi">10.1126/science.1200387</pub-id> <pub-id pub-id-type="pmid">21273488</pub-id></citation></ref>
<ref id="B27"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hood</surname> <given-names>G. A.</given-names></name> <name><surname>Bayley</surname> <given-names>S. E.</given-names></name></person-group> (<year>2009</year>). <article-title>A comparison of riparian plant community response to herbivory by beavers (<italic>Castor canadensis</italic>) and ungulates in Canada&#x2019;s boreal mixed-wood forest.</article-title> <source><italic>For. Ecol. Manage.</italic></source> <volume>258</volume> <fpage>1979</fpage>&#x2013;<lpage>1989</lpage>. <pub-id pub-id-type="doi">10.1016/j.foreco.2009.07.052</pub-id></citation></ref>
<ref id="B28"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Huang</surname> <given-names>Y.</given-names></name> <name><surname>Niu</surname> <given-names>B. F.</given-names></name> <name><surname>Gao</surname> <given-names>Y.</given-names></name> <name><surname>Fu</surname> <given-names>L. M.</given-names></name> <name><surname>Li</surname> <given-names>W. Z.</given-names></name></person-group> (<year>2010</year>). <article-title>CD-HIT suite: a web server for clustering and comparing biological sequences.</article-title> <source><italic>Bioinformatics</italic></source> <volume>26</volume> <fpage>680</fpage>&#x2013;<lpage>682</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btq003</pub-id> <pub-id pub-id-type="pmid">20053844</pub-id></citation></ref>
<ref id="B29"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hyatt</surname> <given-names>D.</given-names></name> <name><surname>Chen</surname> <given-names>G. L.</given-names></name> <name><surname>Locascio</surname> <given-names>P. F.</given-names></name> <name><surname>Land</surname> <given-names>M. L.</given-names></name> <name><surname>Larimer</surname> <given-names>F. W.</given-names></name> <name><surname>Hauser</surname> <given-names>L. J.</given-names></name></person-group> (<year>2010</year>). <article-title>Prodigal: prokaryotic gene recognition and translation initiation site identification.</article-title> <source><italic>BMC Bioinformatics</italic></source> <volume>11</volume>:<issue>119</issue>. <pub-id pub-id-type="doi">10.1186/1471-2105-11-119</pub-id> <pub-id pub-id-type="pmid">20211023</pub-id></citation></ref>
<ref id="B30"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jimen&#x00E9;z</surname> <given-names>D. J.</given-names></name> <name><surname>Brossi</surname> <given-names>M. J. D.</given-names></name> <name><surname>Schuckel</surname> <given-names>J.</given-names></name> <name><surname>Kracun</surname> <given-names>S. K.</given-names></name> <name><surname>Willats</surname> <given-names>W. G. T.</given-names></name> <name><surname>Van Elsas</surname> <given-names>J. D.</given-names></name></person-group> (<year>2016</year>). <article-title>Characterization of three plant biomass-degrading microbial consortia by metagenomics- and metasecretomics-based approaches.</article-title> <source><italic>Appl. Microbiol. Biotechnol.</italic></source> <volume>100</volume> <fpage>10463</fpage>&#x2013;<lpage>10477</lpage>. <pub-id pub-id-type="doi">10.1007/s00253-016-7713-3</pub-id> <pub-id pub-id-type="pmid">27418359</pub-id></citation></ref>
<ref id="B31"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jones</surname> <given-names>P.</given-names></name> <name><surname>Binns</surname> <given-names>D.</given-names></name> <name><surname>Chang</surname> <given-names>H. Y.</given-names></name> <name><surname>Fraser</surname> <given-names>M.</given-names></name> <name><surname>Li</surname> <given-names>W. Z.</given-names></name> <name><surname>Mcanulla</surname> <given-names>C.</given-names></name><etal/></person-group> (<year>2014</year>). <article-title>InterProScan 5: genome-scale protein function classification.</article-title> <source><italic>Bioinformatics</italic></source> <volume>30</volume> <fpage>1236</fpage>&#x2013;<lpage>1240</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btu031</pub-id> <pub-id pub-id-type="pmid">24451626</pub-id></citation></ref>
<ref id="B32"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Krzywinski</surname> <given-names>M.</given-names></name> <name><surname>Schein</surname> <given-names>J.</given-names></name> <name><surname>Birol</surname> <given-names>I.</given-names></name> <name><surname>Connors</surname> <given-names>J.</given-names></name> <name><surname>Gascoyne</surname> <given-names>R.</given-names></name> <name><surname>Horsman</surname> <given-names>D.</given-names></name><etal/></person-group> (<year>2009</year>). <article-title>Circos: an information aesthetic for comparative genomics.</article-title> <source><italic>Genome Res.</italic></source> <volume>19</volume> <fpage>1639</fpage>&#x2013;<lpage>1645</lpage>. <pub-id pub-id-type="doi">10.1101/gr.092759.109</pub-id> <pub-id pub-id-type="pmid">19541911</pub-id></citation></ref>
<ref id="B33"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kumar</surname> <given-names>R.</given-names></name> <name><surname>Singh</surname> <given-names>S.</given-names></name> <name><surname>Singh</surname> <given-names>O. V.</given-names></name></person-group> (<year>2008</year>). <article-title>Bioconversion of lignocellulosic biomass: biochemical and molecular perspectives.</article-title> <source><italic>J. Ind. Microbiol. Biotechnol.</italic></source> <volume>35</volume> <fpage>377</fpage>&#x2013;<lpage>391</lpage>. <pub-id pub-id-type="doi">10.1007/s10295-008-0327-8</pub-id> <pub-id pub-id-type="pmid">18338189</pub-id></citation></ref>
<ref id="B34"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Larsbrink</surname> <given-names>J.</given-names></name> <name><surname>Zhu</surname> <given-names>Y.</given-names></name> <name><surname>Kharade</surname> <given-names>S. S.</given-names></name> <name><surname>Kwiatkowski</surname> <given-names>K. J.</given-names></name> <name><surname>Eijsink</surname> <given-names>V. G. H.</given-names></name> <name><surname>Koropatkin</surname> <given-names>N. M.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>A polysaccharide utilization locus from <italic>Flavobacterium johnsoniae</italic> enables conversion of recalcitrant chitin.</article-title> <source><italic>Biotechnol. Biofuels</italic></source> <volume>9</volume>:<issue>260</issue>. <pub-id pub-id-type="doi">10.1186/s13068-016-0674-z</pub-id> <pub-id pub-id-type="pmid">27933102</pub-id></citation></ref>
<ref id="B35"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lombard</surname> <given-names>V.</given-names></name> <name><surname>Ramulu</surname> <given-names>H. G.</given-names></name> <name><surname>Drula</surname> <given-names>E.</given-names></name> <name><surname>Coutinho</surname> <given-names>P. M.</given-names></name> <name><surname>Henrissat</surname> <given-names>B.</given-names></name></person-group> (<year>2014</year>). <article-title>The carbohydrate-active enzymes database (CAZy) in 2013.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>42</volume> <fpage>D490</fpage>&#x2013;<lpage>D495</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkt1178</pub-id> <pub-id pub-id-type="pmid">24270786</pub-id></citation></ref>
<ref id="B36"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Machovic</surname> <given-names>M.</given-names></name> <name><surname>Janecek</surname> <given-names>S.</given-names></name></person-group> (<year>2008</year>). <article-title>Domain evolution in the GH13 pullulanase subfamily with focus on the carbohydrate-binding module family 48.</article-title> <source><italic>Biologia</italic></source> <volume>63</volume> <fpage>1057</fpage>&#x2013;<lpage>1068</lpage>. <pub-id pub-id-type="doi">10.2478/s11756-008-0162-4</pub-id></citation></ref>
<ref id="B37"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mai-Gisondi</surname> <given-names>G.</given-names></name> <name><surname>Maaheimo</surname> <given-names>H.</given-names></name> <name><surname>Chong</surname> <given-names>S. L.</given-names></name> <name><surname>Hinz</surname> <given-names>S.</given-names></name> <name><surname>Tenkanen</surname> <given-names>M.</given-names></name> <name><surname>Master</surname> <given-names>E.</given-names></name></person-group> (<year>2017</year>). <article-title>Functional comparison of versatile carbohydrate esterases from families CE1, CE6 and CE16 on acetyl-4-O-methylglucuronoxylan and acetyl-galactoglucomannan.</article-title> <source><italic>Biochim. Biophys. Acta</italic></source> <volume>1861</volume> <fpage>2398</fpage>&#x2013;<lpage>2405</lpage>. <pub-id pub-id-type="doi">10.1016/j.bbagen.2017.06.002</pub-id> <pub-id pub-id-type="pmid">28591625</pub-id></citation></ref>
<ref id="B38"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Menzel</surname> <given-names>P.</given-names></name> <name><surname>Ng</surname> <given-names>K. L.</given-names></name> <name><surname>Krogh</surname> <given-names>A.</given-names></name></person-group> (<year>2016</year>). <article-title>Fast and sensitive taxonomic classification for metagenomics with Kaiju.</article-title> <source><italic>Nat. Commun.</italic></source> <volume>7</volume>:<issue>11257</issue>. <pub-id pub-id-type="doi">10.1038/ncomms11257</pub-id> <pub-id pub-id-type="pmid">27071849</pub-id></citation></ref>
<ref id="B39"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mesnage</surname> <given-names>S.</given-names></name> <name><surname>Fontaine</surname> <given-names>T.</given-names></name> <name><surname>Mignot</surname> <given-names>T.</given-names></name> <name><surname>Delepierre</surname> <given-names>M.</given-names></name> <name><surname>Mock</surname> <given-names>M.</given-names></name> <name><surname>Fouet</surname> <given-names>A.</given-names></name></person-group> (<year>2000</year>). <article-title>Bacterial SLH domain proteins are non-covalently anchored to the cell surface via a conserved mechanism involving wall polysaccharide pyruvylation.</article-title> <source><italic>EMBO J.</italic></source> <volume>19</volume> <fpage>4473</fpage>&#x2013;<lpage>4484</lpage>. <pub-id pub-id-type="doi">10.1093/emboj/19.17.4473</pub-id> <pub-id pub-id-type="pmid">10970841</pub-id></citation></ref>
<ref id="B40"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Metsalu</surname> <given-names>T.</given-names></name> <name><surname>Vilo</surname> <given-names>J.</given-names></name></person-group> (<year>2015</year>). <article-title>ClustVis: a web tool for visualizing clustering of multivariate data using Principal Component Analysis and heatmap.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>43</volume> <fpage>W566</fpage>&#x2013;<lpage>W570</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkv468</pub-id> <pub-id pub-id-type="pmid">25969447</pub-id></citation></ref>
<ref id="B41"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mewis</surname> <given-names>K.</given-names></name> <name><surname>Lenfant</surname> <given-names>N.</given-names></name> <name><surname>Lombard</surname> <given-names>V.</given-names></name> <name><surname>Henrissat</surname> <given-names>B.</given-names></name></person-group> (<year>2016</year>). <article-title>Dividing the large glycoside hydrolase family 43 into subfamilies: a motivation for detailed enzyme characterization.</article-title> <source><italic>Appl. Environ. Microbiol.</italic></source> <volume>82</volume> <fpage>1686</fpage>&#x2013;<lpage>1692</lpage>. <pub-id pub-id-type="doi">10.1128/AEM.03453-15</pub-id> <pub-id pub-id-type="pmid">26729713</pub-id></citation></ref>
<ref id="B42"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Morag</surname> <given-names>E.</given-names></name> <name><surname>Halevy</surname> <given-names>I.</given-names></name> <name><surname>Bayer</surname> <given-names>E. A.</given-names></name> <name><surname>Lamed</surname> <given-names>R.</given-names></name></person-group> (<year>1991</year>). <article-title>Isolation and properties of a major cellobiohydrolase from the cellulosome of <italic>Clostridium thermocellum</italic>.</article-title> <source><italic>J. Bacteriol.</italic></source> <volume>173</volume> <fpage>4155</fpage>&#x2013;<lpage>4162</lpage>. <pub-id pub-id-type="doi">10.1128/jb.173.13.4155-4162.1991</pub-id> <pub-id pub-id-type="pmid">2061292</pub-id></citation></ref>
<ref id="B43"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ndeh</surname> <given-names>D.</given-names></name> <name><surname>Rogowski</surname> <given-names>A.</given-names></name> <name><surname>Cartmell</surname> <given-names>A.</given-names></name> <name><surname>Luis</surname> <given-names>A. S.</given-names></name> <name><surname>Basle</surname> <given-names>A.</given-names></name> <name><surname>Gray</surname> <given-names>J.</given-names></name><etal/></person-group> (<year>2017</year>). <article-title>Complex pectin metabolism by gut bacteria reveals novel catalytic functions.</article-title> <source><italic>Nature</italic></source> <volume>544</volume> <fpage>65</fpage>&#x2013;<lpage>70</lpage>. <pub-id pub-id-type="doi">10.1038/nature21725</pub-id> <pub-id pub-id-type="pmid">28329766</pub-id></citation></ref>
<ref id="B44"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Neumuller</surname> <given-names>K. G.</given-names></name> <name><surname>De Souza</surname> <given-names>A. C.</given-names></name> <name><surname>Van Rijn</surname> <given-names>J. H. J.</given-names></name> <name><surname>Streekstra</surname> <given-names>H.</given-names></name> <name><surname>Gruppen</surname> <given-names>H.</given-names></name> <name><surname>Schols</surname> <given-names>H. A.</given-names></name></person-group> (<year>2015</year>). <article-title>Positional preferences of acetyl esterases from different CE families towards acetylated 4-O-methyl glucuronic acid-substituted xylo-oligosaccharides.</article-title> <source><italic>Biotechnol. Biofuels</italic></source> <volume>8</volume>:<issue>7</issue>. <pub-id pub-id-type="doi">10.1186/s13068-014-0187-6</pub-id> <pub-id pub-id-type="pmid">25642285</pub-id></citation></ref>
<ref id="B45"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>O&#x2019;Connor</surname> <given-names>R. M.</given-names></name> <name><surname>Fung</surname> <given-names>J. M.</given-names></name> <name><surname>Sharp</surname> <given-names>K. H.</given-names></name> <name><surname>Benner</surname> <given-names>J. S.</given-names></name> <name><surname>Mcclung</surname> <given-names>C.</given-names></name> <name><surname>Cushing</surname> <given-names>S.</given-names></name><etal/></person-group> (<year>2014</year>). <article-title>Gill bacteria enable a novel digestive strategy in a wood-feeding mollusk.</article-title> <source><italic>Proc. Natl. Acad. Sci. U.S.A.</italic></source> <volume>111</volume> <fpage>E5096</fpage>&#x2013;<lpage>E5104</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1413110111</pub-id> <pub-id pub-id-type="pmid">25385629</pub-id></citation></ref>
<ref id="B46"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Patrascu</surname> <given-names>O.</given-names></name> <name><surname>Beguet-Crespel</surname> <given-names>F.</given-names></name> <name><surname>Marinelli</surname> <given-names>L.</given-names></name> <name><surname>Le Chatelier</surname> <given-names>E.</given-names></name> <name><surname>Abraham</surname> <given-names>A. L.</given-names></name> <name><surname>Leclerc</surname> <given-names>M.</given-names></name><etal/></person-group> (<year>2017</year>). <article-title>A fibrolytic potential in the human ileum mucosal microbiota revealed by functional metagenomic.</article-title> <source><italic>Sci. Rep.</italic></source> <volume>7</volume>:<issue>40248</issue>. <pub-id pub-id-type="doi">10.1038/srep40248</pub-id> <pub-id pub-id-type="pmid">28091525</pub-id></citation></ref>
<ref id="B47"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Peng</surname> <given-names>F.</given-names></name> <name><surname>Peng</surname> <given-names>P.</given-names></name> <name><surname>Xu</surname> <given-names>F.</given-names></name> <name><surname>Sun</surname> <given-names>R. C.</given-names></name></person-group> (<year>2012</year>). <article-title>Fractional purification and bioconversion of hemicelluloses.</article-title> <source><italic>Biotechnol. Adv.</italic></source> <volume>30</volume> <fpage>879</fpage>&#x2013;<lpage>903</lpage>. <pub-id pub-id-type="doi">10.1016/j.biotechadv.2012.01.018</pub-id> <pub-id pub-id-type="pmid">22306329</pub-id></citation></ref>
<ref id="B48"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pold</surname> <given-names>G.</given-names></name> <name><surname>Billings</surname> <given-names>A. F.</given-names></name> <name><surname>Blanchard</surname> <given-names>J. L.</given-names></name> <name><surname>Burkhardt</surname> <given-names>D. B.</given-names></name> <name><surname>Frey</surname> <given-names>S. D.</given-names></name> <name><surname>Melillo</surname> <given-names>J. M.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>Long-term warming alters carbohydrate degradation potential in temperate forest soils.</article-title> <source><italic>Appl. Environ. Microbiol.</italic></source> <volume>82</volume> <fpage>6518</fpage>&#x2013;<lpage>6530</lpage>. <pub-id pub-id-type="doi">10.1128/AEM.02012-16</pub-id> <pub-id pub-id-type="pmid">27590813</pub-id></citation></ref>
<ref id="B49"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pope</surname> <given-names>P. B.</given-names></name> <name><surname>Denman</surname> <given-names>S. E.</given-names></name> <name><surname>Jones</surname> <given-names>M.</given-names></name> <name><surname>Tringe</surname> <given-names>S. G.</given-names></name> <name><surname>Barry</surname> <given-names>K.</given-names></name> <name><surname>Malfatti</surname> <given-names>S. A.</given-names></name><etal/></person-group> (<year>2010</year>). <article-title>Adaptation to herbivory by the <italic>Tammar wallaby</italic> includes bacterial and glycoside hydrolase profiles different from other herbivores.</article-title> <source><italic>Proc. Natl. Acad. Sci. U.S.A.</italic></source> <volume>107</volume> <fpage>14793</fpage>&#x2013;<lpage>14798</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1005297107</pub-id> <pub-id pub-id-type="pmid">20668243</pub-id></citation></ref>
<ref id="B50"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pope</surname> <given-names>P. B.</given-names></name> <name><surname>Mackenzie</surname> <given-names>A. K.</given-names></name> <name><surname>Gregor</surname> <given-names>I.</given-names></name> <name><surname>Smith</surname> <given-names>W.</given-names></name> <name><surname>Sundset</surname> <given-names>M. A.</given-names></name> <name><surname>Mchardy</surname> <given-names>A. C.</given-names></name><etal/></person-group> (<year>2012</year>). <article-title>Metagenomics of the Svalbard reindeer rumen microbiome reveals abundance of polysaccharide utilization loci.</article-title> <source><italic>PLOS ONE</italic></source> <volume>7</volume>:<issue>e38571</issue>. <pub-id pub-id-type="doi">10.1371/journal.pone.0038571</pub-id> <pub-id pub-id-type="pmid">22701672</pub-id></citation></ref>
<ref id="B51"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ravachol</surname> <given-names>J.</given-names></name> <name><surname>Borne</surname> <given-names>R.</given-names></name> <name><surname>Tardif</surname> <given-names>C.</given-names></name> <name><surname>De Philip</surname> <given-names>P.</given-names></name> <name><surname>Fierobe</surname> <given-names>H. P.</given-names></name></person-group> (<year>2014</year>). <article-title>Characterization of all family-9 glycoside hydrolases synthesized by the cellulosome-producing bacterium <italic>Clostridium cellulolyticum</italic>.</article-title> <source><italic>J. Biol. Chem.</italic></source> <volume>289</volume> <fpage>7335</fpage>&#x2013;<lpage>7348</lpage>. <pub-id pub-id-type="doi">10.1074/jbc.M113.545046</pub-id> <pub-id pub-id-type="pmid">24451379</pub-id></citation></ref>
<ref id="B52"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rossmassler</surname> <given-names>K.</given-names></name> <name><surname>Dietrich</surname> <given-names>C.</given-names></name> <name><surname>Thompson</surname> <given-names>C.</given-names></name> <name><surname>Mikaelyan</surname> <given-names>A.</given-names></name> <name><surname>Nonoh</surname> <given-names>J. O.</given-names></name> <name><surname>Scheffrahn</surname> <given-names>R. H.</given-names></name><etal/></person-group> (<year>2015</year>). <article-title>Metagenomic analysis of the microbiota in the highly compartmented hindguts of six wood- or soil-feeding higher termites.</article-title> <source><italic>Microbiome</italic></source> <volume>3</volume>:<issue>56</issue>. <pub-id pub-id-type="doi">10.1186/s40168-015-0118-1</pub-id> <pub-id pub-id-type="pmid">26607965</pub-id></citation></ref>
<ref id="B53"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Simpson</surname> <given-names>J. T.</given-names></name> <name><surname>Wong</surname> <given-names>K.</given-names></name> <name><surname>Jackman</surname> <given-names>S. D.</given-names></name> <name><surname>Schein</surname> <given-names>J. E.</given-names></name> <name><surname>Jones</surname> <given-names>S. J.</given-names></name> <name><surname>Birol</surname> <given-names>I.</given-names></name></person-group> (<year>2009</year>). <article-title>ABySS: a parallel assembler for short read sequence data.</article-title> <source><italic>Genome Res.</italic></source> <volume>19</volume> <fpage>1117</fpage>&#x2013;<lpage>1123</lpage>. <pub-id pub-id-type="doi">10.1101/gr.089532.108</pub-id> <pub-id pub-id-type="pmid">19251739</pub-id></citation></ref>
<ref id="B54"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Singhania</surname> <given-names>R. R.</given-names></name> <name><surname>Patel</surname> <given-names>A. K.</given-names></name> <name><surname>Sukumaran</surname> <given-names>R. K.</given-names></name> <name><surname>Larroche</surname> <given-names>C.</given-names></name> <name><surname>Pandey</surname> <given-names>A.</given-names></name></person-group> (<year>2013</year>). <article-title>Role and significance of beta-glucosidases in the hydrolysis of cellulose for bioethanol production.</article-title> <source><italic>Bioresour. Technol.</italic></source> <volume>127</volume> <fpage>500</fpage>&#x2013;<lpage>507</lpage>. <pub-id pub-id-type="doi">10.1016/j.biortech.2012.09.012</pub-id> <pub-id pub-id-type="pmid">23069613</pub-id></citation></ref>
<ref id="B55"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Smith</surname> <given-names>S. P.</given-names></name> <name><surname>Bayer</surname> <given-names>E. A.</given-names></name> <name><surname>Czjzek</surname> <given-names>M.</given-names></name></person-group> (<year>2017</year>). <article-title>Continually emerging mechanistic complexity of the multi-enzyme cellulosome complex.</article-title> <source><italic>Curr. Opin. Struct. Biol.</italic></source> <volume>44</volume> <fpage>151</fpage>&#x2013;<lpage>160</lpage>. <pub-id pub-id-type="doi">10.1016/j.sbi.2017.03.009</pub-id> <pub-id pub-id-type="pmid">28390861</pub-id></citation></ref>
<ref id="B56"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Song</surname> <given-names>Y. H.</given-names></name> <name><surname>Lee</surname> <given-names>K. T.</given-names></name> <name><surname>Baek</surname> <given-names>J. Y.</given-names></name> <name><surname>Kim</surname> <given-names>M. J.</given-names></name> <name><surname>Kwon</surname> <given-names>M. R.</given-names></name> <name><surname>Kim</surname> <given-names>Y. J.</given-names></name><etal/></person-group> (<year>2017</year>). <article-title>Isolation and characterization of a novel glycosyl hydrolase family 74 (GH74) cellulase from the black goat rumen metagenomic library.</article-title> <source><italic>Folia Microbiol.</italic></source> <volume>62</volume> <fpage>175</fpage>&#x2013;<lpage>181</lpage>. <pub-id pub-id-type="doi">10.1007/s12223-016-0486-3</pub-id> <pub-id pub-id-type="pmid">27866354</pub-id></citation></ref>
<ref id="B57"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Svartstr&#x00F6;m</surname> <given-names>O.</given-names></name> <name><surname>Alneberg</surname> <given-names>J.</given-names></name> <name><surname>Terrapon</surname> <given-names>N.</given-names></name> <name><surname>Lombard</surname> <given-names>V.</given-names></name> <name><surname>De Bruijn</surname> <given-names>I.</given-names></name> <name><surname>Malmsten</surname> <given-names>J.</given-names></name><etal/></person-group> (<year>2017</year>). <article-title>Ninety-nine de novo assembled genomes from the moose (<italic>Alces alces</italic>) rumen microbiome provide new insights into microbial plant biomass degradation.</article-title> <source><italic>ISME J.</italic></source> <volume>11</volume> <fpage>2538</fpage>&#x2013;<lpage>2551</lpage>. <pub-id pub-id-type="doi">10.1038/ismej.2017.108</pub-id> <pub-id pub-id-type="pmid">28731473</pub-id></citation></ref>
<ref id="B58"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Temple</surname> <given-names>M. J.</given-names></name> <name><surname>Cuskin</surname> <given-names>F.</given-names></name> <name><surname>Basl&#x00E9;</surname> <given-names>A.</given-names></name> <name><surname>Hickey</surname> <given-names>N.</given-names></name> <name><surname>Speciale</surname> <given-names>G.</given-names></name> <name><surname>Williams</surname> <given-names>S. J.</given-names></name><etal/></person-group> (<year>2017</year>). <article-title>A Bacteroidetes locus dedicated to fungal 1,6-&#x03B2;-glucan degradation: unique substrate conformation drives specificity of the key endo-1,6-&#x03B2;-glucanase.</article-title> <source><italic>J. Biol. Chem.</italic></source> <volume>292</volume> <fpage>10639</fpage>&#x2013;<lpage>10650</lpage>. <pub-id pub-id-type="doi">10.1074/jbc.M117.787606</pub-id> <pub-id pub-id-type="pmid">28461332</pub-id></citation></ref>
<ref id="B59"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Terrapon</surname> <given-names>N.</given-names></name> <name><surname>Lombard</surname> <given-names>V.</given-names></name> <name><surname>Gilbert</surname> <given-names>H. J.</given-names></name> <name><surname>Henrissat</surname> <given-names>B.</given-names></name></person-group> (<year>2015</year>). <article-title>Automatic prediction of polysaccharide utilization loci in Bacteroidetes species.</article-title> <source><italic>Bioinformatics</italic></source> <volume>31</volume> <fpage>647</fpage>&#x2013;<lpage>655</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btu716</pub-id> <pub-id pub-id-type="pmid">25355788</pub-id></citation></ref>
<ref id="B60"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>van der Lelie</surname> <given-names>D.</given-names></name> <name><surname>Taghavi</surname> <given-names>S.</given-names></name> <name><surname>Mccorkle</surname> <given-names>S. M.</given-names></name> <name><surname>Li</surname> <given-names>L. L.</given-names></name> <name><surname>Malfatti</surname> <given-names>S. A.</given-names></name> <name><surname>Monteleone</surname> <given-names>D.</given-names></name><etal/></person-group> (<year>2012</year>). <article-title>The metagenome of an anaerobic microbial community decomposing poplar wood chips.</article-title> <source><italic>PLOS ONE</italic></source> <volume>7</volume>:<issue>e36740</issue>. <pub-id pub-id-type="doi">10.1371/journal.pone.0036740</pub-id> <pub-id pub-id-type="pmid">22629327</pub-id></citation></ref>
<ref id="B61"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Venditto</surname> <given-names>I.</given-names></name> <name><surname>Luis</surname> <given-names>A. S.</given-names></name> <name><surname>Rydahl</surname> <given-names>M.</given-names></name> <name><surname>Schuckel</surname> <given-names>J.</given-names></name> <name><surname>Fernandes</surname> <given-names>V. O.</given-names></name> <name><surname>Vidal-Melgosa</surname> <given-names>S.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>Complexity of the <italic>Ruminococcus flavefaciens</italic> cellulosome reflects an expansion in glycan recognition.</article-title> <source><italic>Proc. Natl. Acad. Sci. U.S.A.</italic></source> <volume>113</volume> <fpage>7136</fpage>&#x2013;<lpage>7141</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1601558113</pub-id> <pub-id pub-id-type="pmid">27298375</pub-id></citation></ref>
<ref id="B62"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>K.</given-names></name> <name><surname>Pereira</surname> <given-names>G. V.</given-names></name> <name><surname>Cavalcante</surname> <given-names>J. J. V.</given-names></name> <name><surname>Zhang</surname> <given-names>M. L.</given-names></name> <name><surname>Mackie</surname> <given-names>R.</given-names></name> <name><surname>Cann</surname> <given-names>I.</given-names></name></person-group> (<year>2016</year>). <article-title><italic>Bacteroides intestinalis</italic> DSM 17393 a member of the human colonic microbiome, upregulates multiple endoxylanases during growth on xylan.</article-title> <source><italic>Sci. Rep.</italic></source> <volume>6</volume>:<issue>34360</issue>. <pub-id pub-id-type="doi">10.1038/srep34360</pub-id> <pub-id pub-id-type="pmid">27681607</pub-id></citation></ref>
<ref id="B63"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Warnecke</surname> <given-names>F.</given-names></name> <name><surname>Luginbuhl</surname> <given-names>P.</given-names></name> <name><surname>Ivanova</surname> <given-names>N.</given-names></name> <name><surname>Ghassemian</surname> <given-names>M.</given-names></name> <name><surname>Richardson</surname> <given-names>T. H.</given-names></name> <name><surname>Stege</surname> <given-names>J. T.</given-names></name><etal/></person-group> (<year>2007</year>). <article-title>Metagenomic and functional analysis of hindgut microbiota of a wood-feeding higher termite.</article-title> <source><italic>Nature</italic></source> <volume>450</volume> <fpage>560</fpage>&#x2013;<lpage>565</lpage>. <pub-id pub-id-type="doi">10.1038/nature06269</pub-id> <pub-id pub-id-type="pmid">18033299</pub-id></citation></ref>
<ref id="B64"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>White</surname> <given-names>B. A.</given-names></name> <name><surname>Lamed</surname> <given-names>R.</given-names></name> <name><surname>Bayer</surname> <given-names>E. A.</given-names></name> <name><surname>Flint</surname> <given-names>H. J.</given-names></name></person-group> (<year>2014</year>). <article-title>Biomass utilization by gut microbiomes.</article-title> <source><italic>Annu. Rev. Microbiol.</italic></source> <volume>68</volume> <fpage>279</fpage>&#x2013;<lpage>296</lpage>. <pub-id pub-id-type="doi">10.1146/annurev-micro-092412-155618</pub-id> <pub-id pub-id-type="pmid">25002092</pub-id></citation></ref>
<ref id="B65"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wong</surname> <given-names>M. T.</given-names></name> <name><surname>Wang</surname> <given-names>W. J.</given-names></name> <name><surname>Lacourt</surname> <given-names>M.</given-names></name> <name><surname>Couturier</surname> <given-names>M.</given-names></name> <name><surname>Edwards</surname> <given-names>E. A.</given-names></name> <name><surname>Master</surname> <given-names>E. R.</given-names></name></person-group> (<year>2016</year>). <article-title>Substrate-driven convergence of the microbial community in lignocellulose-amended enrichments of gut microflora from the Canadian beaver (<italic>Castor canadensis</italic>) and North American moose (<italic>Alces americanus</italic>).</article-title> <source><italic>Front. Microbiol.</italic></source> <volume>7</volume>:<issue>961</issue>. <pub-id pub-id-type="doi">10.3389/fmicb.2016.00961</pub-id> <pub-id pub-id-type="pmid">27446004</pub-id></citation></ref>
<ref id="B66"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname> <given-names>M. L.</given-names></name> <name><surname>Chekan</surname> <given-names>J. R.</given-names></name> <name><surname>Dodd</surname> <given-names>D.</given-names></name> <name><surname>Hong</surname> <given-names>P. Y.</given-names></name> <name><surname>Radlinski</surname> <given-names>L.</given-names></name> <name><surname>Revindran</surname> <given-names>V.</given-names></name><etal/></person-group> (<year>2014</year>). <article-title>Xylan utilization in human gut commensal bacteria is orchestrated by unique modular organization of polysaccharide-degrading enzymes.</article-title> <source><italic>Proc. Natl. Acad. Sci. U.S.A.</italic></source> <volume>111</volume> <fpage>E3708</fpage>&#x2013;<lpage>E3717</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1406156111</pub-id> <pub-id pub-id-type="pmid">25136124</pub-id></citation></ref>
<ref id="B67"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhu</surname> <given-names>L. F.</given-names></name> <name><surname>Wu</surname> <given-names>Q.</given-names></name> <name><surname>Dai</surname> <given-names>J. Y.</given-names></name> <name><surname>Zhang</surname> <given-names>S. N.</given-names></name> <name><surname>Wei</surname> <given-names>F. W.</given-names></name></person-group> (<year>2011</year>). <article-title>Evidence of cellulose metabolism by the giant panda gut microbiome.</article-title> <source><italic>Proc. Natl. Acad. Sci. U.S.A.</italic></source> <volume>108</volume> <fpage>17714</fpage>&#x2013;<lpage>17719</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1017956108</pub-id> <pub-id pub-id-type="pmid">22006317</pub-id></citation></ref>
</ref-list>
<fn-group>
<fn id="fn01"><label>1</label><p><ext-link ext-link-type="uri" xlink:href="http://www.cazy.org">www.cazy.org</ext-link></p></fn>
<fn id="fn02"><label>2</label><p><ext-link ext-link-type="uri" xlink:href="http://www.cazy.org/PULDB/">http://www.cazy.org/PULDB/</ext-link></p></fn>
</fn-group>
<glossary>
<title>Abbreviations</title>
<def-list id="DL1">
<def-item>
<term>AA</term>
<def>
<p>auxiliary activity</p>
</def>
</def-item>
<def-item>
<term>ABySS</term>
<def>
<p>Assembly By Short Sequences</p>
</def>
</def-item>
<def-item>
<term>CAZyme</term>
<def>
<p>carbohydrate-active enzyme</p>
</def>
</def-item>
<def-item>
<term>CBM</term>
<def>
<p>carbohydrate-binding module</p>
</def>
</def-item>
<def-item>
<term>CE</term>
<def>
<p>carbohydrate esterase</p>
</def>
</def-item>
<def-item>
<term>COD</term>
<def>
<p>chemical oxygen demand</p>
</def>
</def-item>
<def-item>
<term>DUF</term>
<def>
<p>domain of unknown function</p>
</def>
</def-item>
<def-item>
<term>ECF</term>
<def>
<p>extracytoplasmic function</p>
</def>
</def-item>
<def-item>
<term>GH</term>
<def>
<p>glycoside hydrolase</p>
</def>
</def-item>
<def-item>
<term>GT</term>
<def>
<p>glycosyltransferase</p>
</def>
</def-item>
<def-item>
<term>NCBI-NR</term>
<def>
<p>National Center for Biotechnology Information Non-redundant</p>
</def>
</def-item>
<def-item>
<term>NKD</term>
<def>
<p>normalized kmer depths</p>
</def>
</def-item>
<def-item>
<term>ORF</term>
<def>
<p>open-reading frame</p>
</def>
</def-item>
<def-item>
<term>PCA</term>
<def>
<p>principal component analysis</p>
</def>
</def-item>
<def-item>
<term>PUL</term>
<def>
<p>polysaccharide utilization locus</p>
</def>
</def-item>
<def-item>
<term>RPKM</term>
<def>
<p>reads per kilobase per million mapped reads</p>
</def>
</def-item>
</def-list>
</glossary>
</back>
</article>