<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="review-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Mar. Sci.</journal-id>
<journal-title>Frontiers in Marine Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Mar. Sci.</abbrev-journal-title>
<issn pub-type="epub">2296-7745</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fmars.2022.867007</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Marine Science</subject>
<subj-group>
<subject>Review</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Marine Microeukaryote Metatranscriptomics: Sample Processing and Bioinformatic Workflow Recommendations for Ecological Applications</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Cohen</surname>
<given-names>Natalie R.</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/467405"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Alexander</surname>
<given-names>Harriet</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/38650"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Krinos</surname>
<given-names>Arianna I.</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1470593"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Hu</surname>
<given-names>Sarah K.</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/583843"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Lampe</surname>
<given-names>Robert H.</given-names>
</name>
<xref ref-type="aff" rid="aff5">
<sup>5</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/467952"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Skidaway Institute of Oceanography, University of Georgia</institution>, <addr-line>Savannah, GA</addr-line>, <country>United States</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Biology Department, Woods Hole Oceanographic Institution</institution>, <addr-line>Woods Hole, MA</addr-line>, <country>United States</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>MIT-WHOI Joint Program in Oceanography/Applied Ocean Science &amp; Engineering</institution>, <addr-line>Woods Hole, MA</addr-line>, <country>United States</country>
</aff>
<aff id="aff4">
<sup>4</sup>
<institution>Marine Chemistry &amp; Geochemistry Department, Woods Hole Oceanographic Institution</institution>, <addr-line>Woods Hole, MA</addr-line>, <country>United States</country>
</aff>
<aff id="aff5">
<sup>5</sup>
<institution>Integrative Oceanography Division, Scripps Institution of Oceanography, University of California San Diego</institution>, <addr-line>La Jolla, CA</addr-line>, <country>United States</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>Edited by: Angel Borja, Technological Center Expert in Marine and Food Innovation (AZTI), Spain</p>
</fn>
<fn fn-type="edited-by">
<p>Reviewed by: Anders Lanz&#xe9;n, Technology Center Expert in Marine and Food Innovation (AZTI), Spain; Olivier Laroche, Cawthron Institute, New Zealand</p>
</fn>
<fn fn-type="corresp" id="fn001">
<p>*Correspondence: Natalie R. Cohen, <email xlink:href="mailto:cohen@uga.edu">cohen@uga.edu</email>; Harriet Alexander, <email xlink:href="mailto:halexander@whoi.edu">halexander@whoi.edu</email>; Arianna I. Krinos, <email xlink:href="mailto:akrinos@whoi.edu">akrinos@whoi.edu</email>
</p>
</fn>
<fn fn-type="other" id="fn002">
<p>This article was submitted to Marine Ecosystem Ecology, a section of the journal Frontiers in Marine Science</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>28</day>
<month>06</month>
<year>2022</year>
</pub-date>
<pub-date pub-type="collection">
<year>2022</year>
</pub-date>
<volume>9</volume>
<elocation-id>867007</elocation-id>
<history>
<date date-type="received">
<day>31</day>
<month>01</month>
<year>2022</year>
</date>
<date date-type="accepted">
<day>03</day>
<month>05</month>
<year>2022</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2022 Cohen, Alexander, Krinos, Hu and Lampe</copyright-statement>
<copyright-year>2022</copyright-year>
<copyright-holder>Cohen, Alexander, Krinos, Hu and Lampe</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>Microeukaryotes (protists) serve fundamental roles in the marine environment as contributors to biogeochemical nutrient cycling and ecosystem function. Their activities can be inferred through metatranscriptomic investigations, which provide a detailed view into cellular processes, chemical-biological interactions in the environment, and ecological relationships among taxonomic groups. Established workflows have been individually put forth describing biomass collection at sea, laboratory RNA extraction protocols, and bioinformatic processing and computational approaches. Here, we present a compilation of current practices and lessons learned in carrying out metatranscriptomics of marine pelagic protistan communities, highlighting effective strategies and tools used by practitioners over the past decade. We anticipate that these guidelines will serve as a roadmap for new marine scientists beginning in the realms of molecular biology and/or bioinformatics, and will equip readers with foundational principles needed to delve into protistan metatranscriptomics.</p>
</abstract>
<kwd-group>
<kwd>metatranscriptomics</kwd>
<kwd>phytoplankton</kwd>
<kwd>biological oceanography</kwd>
<kwd>microbial ecology</kwd>
<kwd>bioinformatics</kwd>
</kwd-group>
<contract-sponsor id="cn001">Division of Ocean Sciences<named-content content-type="fundref-id">10.13039/100000141</named-content>
</contract-sponsor>
<contract-sponsor id="cn002">Division of Ocean Sciences<named-content content-type="fundref-id">10.13039/100000141</named-content>
</contract-sponsor>
<contract-sponsor id="cn003">University of Georgia<named-content content-type="fundref-id">10.13039/100007699</named-content>
</contract-sponsor>
<contract-sponsor id="cn004">U.S. Department of Energy<named-content content-type="fundref-id">10.13039/100000015</named-content>
</contract-sponsor>
<counts>
<fig-count count="1"/>
<table-count count="1"/>
<equation-count count="1"/>
<ref-count count="168"/>
<page-count count="18"/>
<word-count count="9813"/>
</counts>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<title>Introduction</title>
<p>Metatranscriptomics, or community gene expression profiling, offers a window into transcript pool composition within mixed microbial assemblages. This information can be used to infer taxon-specific physiology and elucidate links between cell metabolism and ecosystem function. When applied to marine systems, it may offer information on the biogeochemical and ecological roles of community members across ecosystems and environmental conditions. Marine metatranscriptomic studies to date have been conducted across spatial and temporal scales (e.g., <xref ref-type="bibr" rid="B147">Sun et&#xa0;al., 2020</xref>; <xref ref-type="bibr" rid="B12">Becker et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B34">Cohen et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B32">Coesel et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B58">Groussman et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B59">Harke et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B106">Muratore et&#xa0;al., 2022</xref>), and in concert with experimental incubations/microcosms in which key biological, chemical and/or physical parameters are manipulated (e.g., <xref ref-type="bibr" rid="B5">Alexander et&#xa0;al., 2015b</xref>; <xref ref-type="bibr" rid="B13">Bertrand et&#xa0;al., 2015</xref>; <xref ref-type="bibr" rid="B82">Lampe et&#xa0;al., 2018</xref>). Such metatranscriptomic investigations into marine protists have expanded our understanding of their nutrient physiology (<xref ref-type="bibr" rid="B4">Alexander et&#xa0;al., 2015a</xref>; <xref ref-type="bibr" rid="B113">Pearson et&#xa0;al., 2015</xref>; <xref ref-type="bibr" rid="B82">Lampe et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B25">Caputi et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B76">Kolody et&#xa0;al., 2019</xref>), nutritional modes (<xref ref-type="bibr" rid="B63">Hu et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B81">Lambert et&#xa0;al., 2021</xref>), coastal bloom dynamics (<xref ref-type="bibr" rid="B55">Gong et&#xa0;al., 2017</xref>; <xref ref-type="bibr" rid="B65">Ji et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B102">Metegnier et&#xa0;al., 2020</xref>), and contributions to ocean biogeochemistry (<xref ref-type="bibr" rid="B27">Carradec et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B34">Cohen et&#xa0;al., 2021</xref>).</p>
<p>Marine meta-omic studies, or community omic analyses performed in the environment, emerged in the 2000s with the first successful applications of shotgun DNA sequencing to microbial communities of the open ocean (<xref ref-type="bibr" rid="B156">Venter et&#xa0;al., 2004</xref>; <xref ref-type="bibr" rid="B126">Rusch et&#xa0;al., 2007</xref>). Early marine meta-omic studies relied upon high-throughput Sanger and second generation sequencing (454 pyrosequencing and SOLiD) platforms (<xref ref-type="bibr" rid="B156">Venter et&#xa0;al., 2004</xref>; <xref ref-type="bibr" rid="B126">Rusch et&#xa0;al., 2007</xref>; <xref ref-type="bibr" rid="B54">Gilbert et&#xa0;al., 2008</xref>; <xref ref-type="bibr" rid="B101">McCarren et&#xa0;al., 2010</xref>; <xref ref-type="bibr" rid="B146">Stewart et&#xa0;al., 2010</xref>), with the first metatranscriptomic study focusing on marine microeukaryotes released in 2012 (<xref ref-type="bibr" rid="B98">Marchetti et&#xa0;al., 2012</xref>). Pyrosequencing and SOLiD platforms were later replaced by Illumina bridge amplification-based sequencing as a result of unparalleled throughput, low error rates, and mid-range read lengths (~2 x 150 bp, paired-end) that were longer than SOLiD (~85 bp), but shorter than pyrosequencing and Sanger sequencing (&gt;400 bp) (<xref ref-type="bibr" rid="B92">Liu et&#xa0;al., 2012</xref>; <xref ref-type="bibr" rid="B8">Ambardar et&#xa0;al., 2016</xref>; <xref ref-type="bibr" rid="B162">Wilms, 2021</xref>). The price of sequencing has continued to decrease, while the degree of throughput has increased (<xref ref-type="bibr" rid="B104">Muir et&#xa0;al., 2016</xref>).</p>
<p>Marine metatranscriptomic initiatives have greatly benefited from the expansion of reference sequence libraries derived from laboratory isolates, such as the Marine Microbial Eukaryote Transcriptome Sequencing Project (MMETSP) (<xref ref-type="bibr" rid="B70">Keeling et&#xa0;al., 2014</xref>; <xref ref-type="bibr" rid="B26">Caron et&#xa0;al., 2017</xref>). The MMETSP database is composed of over 678 protistan transcriptomes from 405 unique strains (<xref ref-type="bibr" rid="B80">Krinos et&#xa0;al., 2021</xref>) and is widely used in current marine omic workflows (e.g., <xref ref-type="bibr" rid="B82">Lampe et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B76">Kolody et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B58">Groussman et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B79">Krinos et&#xa0;al., 2022</xref>). Oceanographic field expeditions such as <italic>Tara Oceans</italic> (<xref ref-type="bibr" rid="B27">Carradec et&#xa0;al., 2018</xref>) and <italic>bioGEOTRACES</italic> (<xref ref-type="bibr" rid="B15">Biller et&#xa0;al., 2018</xref>) are leveraging this database and other recently generated eukaryotic transcriptomes and genomes to uncover the taxonomic and functional roles of protists across ocean basins (<xref ref-type="bibr" rid="B27">Carradec et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B3">Alexander et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B161">Weissman et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B16">Blaxter et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B38">Delmont et&#xa0;al., 2022</xref>). These large field datasets describing the biographical and functional distribution of protists consist of sequence data, taxonomic and functional annotations, and contextualizing environmental metadata, and serve as invaluable community resources for researchers, students, and the public to use (<xref ref-type="bibr" rid="B15">Biller et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B27">Carradec et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B157">Villar et&#xa0;al., 2018</xref>).</p>
<p>The computational biology landscape is rapidly evolving as more efficient bioinformatic tools are developed and pipelines become more easily accessible. There has been a concerted community effort towards increasing reproducibility of data analysis by documenting protocols, archiving code and raw data, and making bioinformatic data products available to scientific audiences (<xref ref-type="bibr" rid="B129">Sandve et&#xa0;al., 2013</xref>; <xref ref-type="bibr" rid="B151">Tully et&#xa0;al., 2021</xref>). These resources are invaluable to new practitioners lacking formal training in molecular biology, computational biology, and/or statistics.</p>
<p>The interdisciplinary oceanographic community in particular would benefit from a comprehensive overview that emphasizes current approaches used to conduct microeukaryote metatranscriptomics. Here we present a compiled resource highlighting the latest practices and procedures, from sample collection to computational analysis. This effort complements other valuable environmental metatranscriptomic reviews that have been recently published (e.g., <xref ref-type="bibr" rid="B138">Shakya et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B105">Mukherjee and Reddy, 2020</xref>; <xref ref-type="bibr" rid="B166">Zhang et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B162">Wilms, 2021</xref>; <xref ref-type="bibr" rid="B75">Kolody et&#xa0;al., 2022</xref>). We anticipate these recommendations will continue to evolve in the coming years, and encourage researchers to explore current sequencing platform options and bioinformatic workflows, and to consult updated versions of tool documentation before beginning new analyses. It may be particularly valuable for those with a microbial ecology and/or oceanography background to engage in discussions and apply principles learned from computational biologists (and vice versa) to effectively innovate across these subfields. Our descriptions of protocols, pipelines and tools are not intended to be technical accounts but rather a descriptive guide for beginning and returning practitioners, and readers are referred to individual publications for further details.</p>
</sec>
<sec id="s2">
<title>Sample Acquisition</title>
<sec id="s2_1">
<title>Collection and Filtration of Microbial Communities From Pelagic Seawater</title>
<p>The seawater volumes required to obtain suitable biomass for metatranscriptomic sequencing varies depending on the ecosystem. In offshore waters, volumes ~10 L or greater are generally recommended, while coastal systems supporting higher biomass require much lower volume (<xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>). Sample volumes that are too low have been shown to skew relative abundances of 16S rRNA amplicon sequences, with volumes &gt;1 L generally encouraged (<xref ref-type="bibr" rid="B110">Padilla et&#xa0;al., 2015</xref>); this is likely also true for metatranscriptomic data, though has not yet been systematically verified.</p>
<table-wrap id="T1" position="float">
<label>Table&#xa0;1</label>
<caption>
<p>Field processing procedures in recent marine microeukaryote metatranscriptomic studies.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="left">Analysis</th>
<th valign="top" align="center">Region</th>
<th valign="top" align="center">Approx. Seawater volume (L)</th>
<th valign="top" align="center">Filtration type</th>
<th valign="top" align="center">Porosity (&#x3bc;m)</th>
<th valign="top" align="center">Filter type</th>
<th valign="top" align="center">RNA extraction</th>
<th valign="top" align="center">Library prep</th>
<th valign="top" align="center">Sequence platform</th>
<th valign="top" align="center">Reference</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Experimental</td>
<td valign="top" align="center">North Pacific Subtropical Gyre</td>
<td valign="top" align="center">60</td>
<td valign="top" align="center">Shipboard</td>
<td valign="top" align="center">5-200</td>
<td valign="top" align="center">Polycarbonate</td>
<td valign="top" align="center">Qiagen RNeasy Mini Kit</td>
<td valign="top" align="center">poly-A selection</td>
<td valign="top" align="center">Illumina HiSeq</td>
<td valign="top" align="center">
<xref ref-type="bibr" rid="B5">Alexander et&#xa0;al., 2015b</xref>
</td>
</tr>
<tr>
<td valign="top" align="left">Experimental</td>
<td valign="top" align="center">Ross Sea</td>
<td valign="top" align="center">0.45</td>
<td valign="top" align="center">Shipboard</td>
<td valign="top" align="center">&gt;0.2</td>
<td valign="top" align="center">Sterivex</td>
<td valign="top" align="center">Life Technologies TRIzol</td>
<td valign="top" align="center">rRNA depletion &amp; poly-A selection</td>
<td valign="top" align="center">Illumina HiSeq</td>
<td valign="top" align="center">
<xref ref-type="bibr" rid="B13">Bertrand et&#xa0;al., 2015</xref>
</td>
</tr>
<tr>
<td valign="top" align="left">Experimental</td>
<td valign="top" align="center">Northeast Pacific &amp; California Current</td>
<td valign="top" align="center">8</td>
<td valign="top" align="center">Shipboard</td>
<td valign="top" align="center">&gt;0.8</td>
<td valign="top" align="center">Polyethersulfone</td>
<td valign="top" align="center">Invitrogen ToTALLY RNA Kit</td>
<td valign="top" align="center">poly-A selection</td>
<td valign="top" align="center">Illumina HiSeq</td>    <td valign="top" align="center">
<xref ref-type="bibr" rid="B82">Lampe et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B33">Cohen et&#xa0;al., 2017</xref>
</td>
</tr>
<tr>
<td valign="top" align="left">Temporal</td>
<td valign="top" align="center">North Pacific Subtropical Gyre</td>
<td valign="top" align="center">7</td>
<td valign="top" align="center">Shipboard</td>
<td valign="top" align="center">0.2-100</td>
<td valign="top" align="center">Polycarbonate</td>
<td valign="top" align="center">Invitrogen ToTALLY RNA Kit</td>
<td valign="top" align="center">poly-A selection</td>
<td valign="top" align="center">Illumina NextSeq</td>    <td valign="top" align="center">
<xref ref-type="bibr" rid="B32">Coesel et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B58">Groussman et&#xa0;al., 2021</xref>
</td>
</tr>
<tr>
<td valign="top" align="left">Temporal</td>
<td valign="top" align="center">California Current</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">Environmental Sample Processor (ESP)</td>
<td valign="top" align="center">&gt;5</td>
<td valign="top" align="center">Polyvinylidene fluoride</td>
<td valign="top" align="center">Invitrogen mirVana miRNA Isolation kit</td>
<td valign="top" align="center">poly-A selection</td>
<td valign="top" align="center">Illumina HiSeq</td>    <td valign="top" align="center">
<xref ref-type="bibr" rid="B76">Kolody et&#xa0;al., 2019</xref>
</td>
</tr>
<tr>
<td valign="top" align="left">Spatial &amp; Temporal</td>
<td valign="top" align="center">North Pacific Subtropical Gyre</td>
<td valign="top" align="center">20</td>
<td valign="top" align="center">Shipboard</td>
<td valign="top" align="center">5-200</td>
<td valign="top" align="center">Polycarbonate</td>
<td valign="top" align="center">Qiagen RNeasy Mini Kit</td>
<td valign="top" align="center">poly-A selection</td>
<td valign="top" align="center">Illumina HiSeq</td>
<td valign="top" align="center">
<xref ref-type="bibr" rid="B59">Harke et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B12">Becker et&#xa0;al., 2021</xref>
</td>
</tr>
<tr>
<td valign="top" align="left">Spatial</td>
<td valign="top" align="center">Global</td>
<td valign="top" align="center">100 - 150,000</td>
<td valign="top" align="center">Shipboard &amp; plankton nets</td>
<td valign="top" align="center">0.8&#x2013;5, 5&#x2013;20, 20&#x2013;180, 180-2000</td>
<td valign="top" align="center">Polycarbonate</td>
<td valign="top" align="center">NucleoSpin RNA Midi kits</td>
<td valign="top" align="center">poly-A selection</td>
<td valign="top" align="center">Illumina HiSeq</td>
<td valign="top" align="center">
<xref ref-type="bibr" rid="B27">Carradec et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B25">Caputi et&#xa0;al., 2019</xref>
</td>
</tr>
<tr>
<td valign="top" align="left">Spatial</td>
<td valign="top" align="center">central Pacific Ocean</td>
<td valign="top" align="center">100-1,000</td>
<td valign="top" align="center">Underwater McLane pumps</td>
<td valign="top" align="center">3-51</td>
<td valign="top" align="center">Acrylic</td>
<td valign="top" align="center">Life Technologies TRIzol</td>
<td valign="top" align="center">rRNA depletion &amp; poly-A selection</td>
<td valign="top" align="center">Illumina HiSeq</td>    <td valign="top" align="center">
<xref ref-type="bibr" rid="B34">Cohen et&#xa0;al., 2021</xref>
</td>
</tr>
<tr>
<td valign="top" align="left">Spatial</td>
<td valign="top" align="center">San Pedro Ocean Time-series (coastal Southern California)</td>
<td valign="top" align="center">1.5 - 3.5</td>
<td valign="top" align="center">Shipboard</td>
<td valign="top" align="center">0.7-80</td>
<td valign="top" align="center">GF/F</td>
<td valign="top" align="center">Qiagen DNA/RNA AllPrep kit</td>
<td valign="top" align="center">poly-A selection</td>
<td valign="top" align="center">Illumina HiSeq</td>    <td valign="top" align="center">
<xref ref-type="bibr" rid="B63">Hu et&#xa0;al., 2018</xref>
</td>
</tr>
<tr>
<td valign="top" rowspan="2" align="left">Spatial &amp; Temporal</td>
<td valign="top" rowspan="2" align="center">CalCOFI grid(Southern California Current)</td>
<td valign="top" rowspan="2" align="center">4</td>
<td valign="top" rowspan="2" align="center">Shipboard</td>
<td valign="top" rowspan="2" align="center">0.22</td>
<td valign="top" rowspan="2" align="center">Sterivex</td>
<td valign="top" rowspan="2" align="center">Machery-Nagel NucleoMag RNA kit</td>
<td valign="top" rowspan="2" align="center">rRNA depletion &amp; poly-A selection</td>
<td valign="top" rowspan="2" align="center">Illumina HiSeq &amp; NovaSeq</td>
<td valign="top" rowspan="2" align="center">
<xref ref-type="bibr" rid="B117">Rabines et&#xa0;al., 2020a</xref>, <xref ref-type="bibr" rid="B118">Rabines et al., 2020b</xref>
</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p>The Analysis column indicates the type of metatranscriptional analysis performed, with &#x201c;Experimental&#x201d; representing incubations performed at sea, &#x201c;Temporal&#x201d; indicating surveys across time, and &#x201c;Spatial&#x201d; referring to studies across horizontal (latitudes, longitudes) or vertical (depth) zonations.  &#x201c;Shipboard&#x201d; filtration type refers to either vacuum or peristaltic pump devices used in shipboard laboratories directly following seawater collection.</p>
</table-wrap-foot>
</table-wrap>
<p>While larger seawater volumes are ideal for the collection of sufficient biomass, the logistics of processing samples in the field (e.g., shipboard) must also be considered. Nucleic acid sample collection from seawater requires rapid filtration and preservation (<xref ref-type="bibr" rid="B49">Frias-Lopez et&#xa0;al., 2008</xref>), otherwise RNA degradation or unintended changes in the RNA pool may occur (<xref ref-type="bibr" rid="B51">Gallego Romero et&#xa0;al., 2014</xref>; <xref ref-type="bibr" rid="B75">Kolody et&#xa0;al., 2022</xref>), and cells may metabolically respond to changes in light and temperature during long collection times. Peristaltic pumps in conjunction with 47-142&#xa0;mm in-line filter manifolds or Sterivex (Millipore) filters enable large volumes to be filtered rapidly and effectively (Table&#xa0;1). Notably, filters may clog as biomass accumulates, especially for small filter size fractions, impacting filter effectiveness and sample quality. The filtration time may be reduced by splitting volumes across multiple filters. It is important to consider pump pressure levels during the filtration process, as high pressure could rupture cells before preservation, leading to RNA loss.</p>
<p>Increasingly, underwater battery-operated McLane filtration pumps (<xref ref-type="bibr" rid="B127">Saito et&#xa0;al., 2014</xref>), Lagrangian-like Environmental Sample Processors (<xref ref-type="bibr" rid="B135">Scholin et&#xa0;al., 2017</xref>; <xref ref-type="bibr" rid="B76">Kolody et&#xa0;al., 2019</xref>), Autonomous Underwater Vehicles (<xref ref-type="bibr" rid="B19">Breier et&#xa0;al., 2020</xref>), and other sensors (<xref ref-type="bibr" rid="B109">Ottesen, 2016</xref>) capable of <italic>in situ</italic> filtration at ambient temperature and pressure are being utilized. High-volume pumping mechanisms offered by McLane pumps and AUVs in particular are ideal for concentrating large amounts of biomass. These <italic>in situ</italic> approaches are useful for deep sea sampling, where depressurization during traditional seawater collection and processing may result in inaccurate assessments of community dynamics (<xref ref-type="bibr" rid="B44">Edgcomb et&#xa0;al., 2016</xref>). Filtration time is likely still important to consider in study designs using underwater pumps, as long filtrations may result in an integrated metatranscriptomic signal over time as biomass aggregates. With any sampling system used, the time needed to recover filters and preserve samples should be minimized (&lt; 1 hour, if possible) to prevent RNA degradation.</p>
<p>Typical filter fraction size ranges for marine protists span 0.8 - 200 &#x3bc;m (<xref ref-type="bibr" rid="B115">Pesant et&#xa0;al., 2015</xref>) and generally align with the plankton size fractions (<xref ref-type="bibr" rid="B107">Omori and Ikeda, 1992</xref>). In some studies, no upper bound size threshold is used, and multicellular eukaryotes are included in the analysis (<xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>). It&#x2019;s important to note that the specific size fraction used to capture protists will vary depending on the group of organisms intended to collect, with characterized smaller protists such as the green algae <italic>Ostreococcus</italic> approximately ~1 &#x3bc;m in diameter (<xref ref-type="bibr" rid="B39">Derelle et&#xa0;al., 2006</xref>), and members of the Foraminifera on the larger end of the size spectrum at &gt;150 &#x3bc;m (<xref ref-type="bibr" rid="B93">Lo Giudice Cappelli and Austin, 2019</xref>). Size-fractionated filtering can be an advantageous strategy for capturing multiple distinct plankton size classes (<xref ref-type="bibr" rid="B157">Villar et&#xa0;al., 2018</xref>), in which filter membranes are either stacked and separated by backing filters, or arranged serially in separate filter manifolds. This approach may be valuable in concentrating biomass from specific groups of interest, but is imperfect as filters aggregate biomass especially with large seawater volumes, and smaller than intended particles may be captured on filters (<xref ref-type="bibr" rid="B34">Cohen et&#xa0;al., 2021</xref>). It is furthermore difficult to directly compare gene expression across these distinct size fractions, though may be approximated using biomass normalizations (<xref ref-type="bibr" rid="B42">Dupont et&#xa0;al., 2015</xref>).</p>
<p>Filter membranes made of polyethersulfone or polycarbonate are commonly used, and allow sufficient resuspension of material during the RNA extraction procedure (Table&#xa0;1). RNA rapidly degrades, and instant RNA stabilization achieved <italic>via</italic> flash freezing with liquid nitrogen is recommended prior to storage at -80&#xb0;C (<xref ref-type="bibr" rid="B7">Alvarez et&#xa0;al., 2015</xref>). If -80&#xb0;C storage is not available on ships, RNA can be stored up to 1 week at room temperature, 1 month at 4&#xb0;C, or indefinitely at -20&#xb0;C using the RNAlater (Invitrogen) preservative reagent. However, RNAlater may result in inadvertent physiological changes in the RNA pool (<xref ref-type="bibr" rid="B111">Passow et&#xa0;al., 2019</xref>). Care should be taken in evaluating available storage mechanisms in the field and the potential risks of preservatives.</p>
<p>Biological replicates are generally required to determine statistical differences in gene expression and physiology across treatments or spatial zonation, but logistic constraints onboard research vessels often prevent repeat collection of seawater. In addition, microbial communities at a given location, depth, and time of day can rapidly shift due to the heterogeneous and highly dynamic nature of the ocean environment, complicating efforts to obtain replicated snapshots of community composition and function. This can however represent natural biological variability in a system, and samples collected from the same location may indeed serve as replicates, depending on the study objectives and spatial scope. Researchers may instead prioritize additional sampling depths, locations, or time points to capture transcript pools with high resolution. Samples collected from similar latitudes and depths may reflect similar biological properties, thus demonstrating oceanographic consistency across space and time (<xref ref-type="bibr" rid="B28">Cerdan-Garcia et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B61">Hogle et&#xa0;al., 2021</xref>). High frequency sampling may identify metabolic trends that either change on a diel cycle (e.g., energy partitioning), or are unaffected by temporal dynamics (e.g., chronic nutrient stress). In particular, there is significant diel periodicity in metabolic processes carried out by protists in surface waters (<xref ref-type="bibr" rid="B76">Kolody et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B12">Becker et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B58">Groussman et&#xa0;al., 2021</xref>), and time of day should therefore be considered in sampling designs.</p>
</sec>
<sec id="s2_2">
<title>RNA Extraction Procedure</title>
<p>RNA extractions from microeukaryotic cells collected onto filters may be performed using popular commercially available kits (Table&#xa0;1). Common modifications include the addition of silica or zirconia beads to lysis buffer and bead-beating to assist with the physical disruption of cell walls during the RNA extraction, which is useful for hard-shelled protists. Total RNA yields and quality may be estimated using a Nanodrop spectrophotometer (Thermo Scientific), though a Qubit fluorometer (Invitrogen), Bioanalyzer (Agilent) or Tapestation (Agilent) will produce more accurate estimates of RNA concentration, especially at lower concentrations (<xref ref-type="bibr" rid="B64">Hussing et&#xa0;al., 2018</xref>). The RiboGreen (Promega) fluorescent nucleic acid stain is another suitable option for RNA quantification with high sensitivity (<xref ref-type="bibr" rid="B67">Jones et&#xa0;al., 1998</xref>). The Bioanalyzer and Tapestation will additionally provide information on RNA quality, including RNA integrity number (RIN) scores, which reflect degree of RNA degradation. High RIN scores represent high quality RNA (<xref ref-type="bibr" rid="B136">Schroeder et&#xa0;al., 2006</xref>). RIN scores above 7 are encouraged for Illumina library preparation, although low RNA yields and partial degradation that occurs during the seawater filtration process may make it difficult to reach high RIN scores (<xref ref-type="bibr" rid="B2">Alberti et&#xa0;al., 2017</xref>). However, certain protocols allow modifications for low RIN RNA to be used in the library preparation process.</p>
<p>In addition to relative transcript abundances obtained through metatranscriptomic sequencing, approaches have been developed to estimate transcript copies L<sup>-1</sup> to more directly relate metabolic information to biogeochemical measurements, and to circumvent limitations inherent to relative analyses (<xref ref-type="bibr" rid="B131">Satinsky et&#xa0;al., 2013</xref>; <xref ref-type="bibr" rid="B53">Gifford et&#xa0;al., 2014</xref>). Custom-built plasmids or commercially available mRNA internal standards (e.g., ERCC Spike-In [Thermo Scientific], ArrayControl RNA Spikes [Invitrogen], Sequins [Garvan Institute of Medical Research]) can be added to lysis buffer during the initial stages of the RNA extraction, and will reflect losses during the laboratory procedure. Assuming the exact volume filtered is known, the number of added mRNA standard copies sequenced can be used to estimate transcript concentration in the sample (<xref ref-type="bibr" rid="B131">Satinsky et&#xa0;al., 2013</xref>; <xref ref-type="bibr" rid="B53">Gifford et&#xa0;al., 2014</xref>; see below). Increasing the number of distinct mRNA standards spiked will strengthen the copies-to-sequences estimation. An appropriate rule of thumb is to add the mRNA spike concentration at a target ratio of ~1% the total RNA pool (<xref ref-type="bibr" rid="B53">Gifford et&#xa0;al., 2014</xref>). Note that the number of RNA copies per cell may differ by organism, with larger cells generally containing higher RNA concentrations (<xref ref-type="bibr" rid="B99">Marguerat and B&#xe4;hler, 2012</xref>). Transcript pools furthermore fluctuate over the course of a day, with phytoplankton groups under different diel transcriptional regulation (<xref ref-type="bibr" rid="B58">Groussman et&#xa0;al., 2021</xref>). These factors may contribute to the copies L<sup>-1</sup> estimate among taxa not fully scaling with absolute cell densities. It is recommended to collect direct information on biomass, including pigments and/or cell counts (flow cytometry, fluid imaging, microscopy, etc), to provide environmental context for transcript-derived copies L<sup>-1</sup>.</p>
</sec>
<sec id="s2_3">
<title>Sequencing Platforms &amp; Library Preparation</title>
<p>Popular and cost effective second generation sequencing technology platforms for metatranscriptomics include Illumina Miseq and Hiseq (Table&#xa0;1), with these older platforms being replaced by the newer and more efficient Nextseq and Novaseq. Novaseq currently offers the greatest output (~20 billion reads per run), with the Miseq platform still offering the longest read lengths (2 x 300 base pairs) but Novaseq not far behind with 2 x 250 base pairs possible using the Novaseq SP flow cell.</p>
<p>For mRNA-Seq studies performed with the Illumina platform, RNA is converted to cDNA and fragmented as part of the sequencing library preparation process. It is important to ensure that the sequencing library preparation method chosen enriches for protein-coding RNA, or messenger RNA (mRNA), because the majority of the total RNA pool in eukaryotes consists of ribosomal RNA (rRNA) (<xref ref-type="bibr" rid="B23">Bush et&#xa0;al., 2017</xref>). Two approaches may be used: rRNA depletion, in which rRNA is removed and non-coding RNA and mRNA remain, and polyadenylated RNA (poly-A) selection, in which mRNA containing poly-A tails (characteristic of eukaryotic mRNA) is selected along with other poly-A-containing non-coding RNA (<xref ref-type="bibr" rid="B37">Cui et&#xa0;al., 2010</xref>). The methods differ in resulting RNA pools, coverage, and quantitative accuracy (<xref ref-type="bibr" rid="B167">Zhao et&#xa0;al., 2018</xref>), with poly-A selection yielding more protein-coding sequences at a given sequencing depth (<xref ref-type="bibr" rid="B29">Chen et&#xa0;al., 2020</xref>). A key difference is that rRNA depletion will select for mRNA from both microbial prokaryotes and eukaryotes, while poly-A selection will be biased towards eukaryotes containing poly-adenylated mRNA. Additionally, rRNA depletion better recovers important eukaryotic organelle transcripts without selection bias. These non-target sequences may provide valuable information especially regarding plastid expression (<xref ref-type="bibr" rid="B141">Smith, 2013</xref>), such as Rubisco and cytochrome oxidase, which are of biogeochemical interest (<xref ref-type="bibr" rid="B42">Dupont et&#xa0;al., 2015</xref>; <xref ref-type="bibr" rid="B75">Kolody et&#xa0;al., 2022</xref>). It is unclear whether these non-target sequences are truly able to be used comparatively across samples or whether the level of non-poly-A RNA contamination differs depending on sample matrix or other factors. Both rRNA depletion and poly-A selection are commonly used in marine microeukaryote studies (Table&#xa0;1), and should be selected based on specific scientific goals and interests. Note that when analyzing metatranscriptomes processed using rRNA depletion, recovery of eukaryotes might be low, and prokaryotes may constitute the majority of the sequence library. Popular methods for rRNA depletion include Ribo-Zero (Illumina) and riboPOOLs, which are available in custom mixtures to reduce rRNA from phylogenetically diverse species (siTOOLS Biotech).</p>
<p>Approximately 0.1 - 1 &#x3bc;g of total RNA is suggested for standard whole transcriptome library preparation prior to second generation sequencing using the TruSeq Stranded mRNA library prep kit (Illumina), and as low as 25 ng using the newer Stranded mRNA Prep kit (Illumina). Both of these kits capture poly-adenylated mRNA. In many oligotrophic regions, especially deeper in the water column, obtaining high concentrations of RNA is not feasible given sampling and experimental design limitations. Specialized cDNA library preparation kits are compatible with input material as low as 250 pg total RNA in which additional linear amplification cycles are performed, such as with the SMART-Seq v4 Ultra Low Input RNA Kit (Clontech). Although more expensive, the SMART-Seq v4 approach produces similar results to those obtained using larger RNA input (<xref ref-type="bibr" rid="B143">Song et&#xa0;al., 2018</xref>) and is a suitable option for low RNA yields from oligotrophic or otherwise low biomass regions of the ocean. Intriguingly, the SMART-Seq protocol appears to capture a non-negligible pool of prokaryotic transcripts despite enrichment for poly-A RNA, although this has not been explicitly tested across library preparation kit methods; a systematic comparison using natural marine communities will be important for determining whether library preparation biases are occurring. Due to these overt differences in resulting sequence libraries between library preparation methods and mRNA enrichment strategies, it is not recommended to mix and match methods in a single experimental dataset.</p>
<p>An alternative aquatic metatranscriptomic approach is sequencing the entire RNA pool. This method provides valuable information on transcriptionally active taxonomic community members through dominant rRNA reads, with limited insights into the functional composition gained through the abundant mRNA captured (<xref ref-type="bibr" rid="B101">McCarren et&#xa0;al., 2010</xref>; <xref ref-type="bibr" rid="B140">Shi et&#xa0;al., 2012</xref>; <xref ref-type="bibr" rid="B10">Baker et&#xa0;al., 2013</xref>; <xref ref-type="bibr" rid="B85">Lanz&#xe9;n et&#xa0;al., 2013</xref>; <xref ref-type="bibr" rid="B165">Wu et&#xa0;al., 2013</xref>). This method is therefore most appropriate when functional characterization is of secondary importance to taxonomic composition.</p>
<p>Third generation sequencing platforms are gaining in popularity and hold great potential for long read metatranscriptomic sequencing with high accuracy and throughput, without PCR amplification bias or short read assembly challenges (<xref ref-type="bibr" rid="B71">Kerkhof, 2021</xref>). In contrast to the Illumina library preparation process in which RNA is required to be converted to cDNA, third generation sequencing technology can sequence RNA molecules directly. These applications to the marine environment are nascent and still being developed, with current limitations including relatively high read error rate and inter-run variability (<xref ref-type="bibr" rid="B137">Semmouri et&#xa0;al., 2020</xref>). However, preliminary findings show successful application to marine pelagic zooplankton communities, with high predicted protein content (<xref ref-type="bibr" rid="B137">Semmouri et&#xa0;al., 2020</xref>). Metatranscriptomes generated using third generation sequencing platforms will have the added benefit of detecting long 18S rRNA molecules in the sequenced RNA pool, providing a direct assessment of community composition alongside predicted proteins (<xref ref-type="bibr" rid="B137">Semmouri et&#xa0;al., 2020</xref>).</p>
</sec>
</sec>
<sec id="s3">
<title>Bioinformatic Pipeline Recommendations</title>
<p>After RNA is collected from field sites, extracted in the laboratory, and sequenced, the bioinformatic process begins (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1</bold>
</xref>). Oceanographic research publications are generally required to include field and lab-based methods in enough detail to enable reproducibility. Unfortunately, details regarding bioinformatic tool usage are not always included in study methods, and it can therefore be difficult for others to replicate analyses and determine how each step of the bioinformatic pipeline influences downstream biological interpretations. In addition, many tools and pipelines are not created with microeukaryotes in mind, and special parameters, settings, or considerations may need to be applied. Typically tools are chosen for a specific research question or purpose, meaning that one researcher&#x2019;s approach may not be suitable in other circumstances. Therefore, disclosing details and reasoning for performing these critical computational steps will help the broader community evaluate the method. It is especially helpful to include a short justification for the method chosen in study descriptions. This transparency will reduce the steep learning curves in computational biology by encouraging such consistent practices and open data sharing policies.</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>Flow chart of a metranscriptomic pipeline designed for marine microeukaryotes (right). Visual depiction of the main workflow steps, including cell extraction, sequencing, assembly, read mapping, and annotations (left). Example annotations are shown for three phytoplankton taxa (<xref ref-type="bibr" rid="B45">Ellis et&#xa0;al., 2017</xref>, <xref ref-type="bibr" rid="B33">Cohen et&#xa0;al., 2017</xref>, <xref ref-type="bibr" rid="B164">Wu et&#xa0;al., 2019</xref>, <xref ref-type="bibr" rid="B120">Rao, 2020</xref>). Note that many predicted proteins do not correspond to a known functional annotation. Example graphics and statistical approaches used to investigate metatranscriptomic output (bottom): Ordinations may be created using orthologous groups or functional annotations aggregated to the taxonomic level of interest. Heatmaps are constructed using normalized gene expression and can be subset to include biostatistically or biologically relevant genes. Heatmaps and ordinations are useful in identifying similarities among sampling groups. 2D section plots show differences in the relative abundance of gene expression across space (or time), highlighting shifts in ecological strategies. MA plots are created using normalized gene expression corresponding to taxonomic/functional annotations or orthologous groups, and are useful in assessing differential expression between pairwise experimental treatments or groupings. Networks are built using normalized gene expression corresponding to taxonomic/functional annotations or orthologous groups, and highlight co-occurring genes. They can be paired with metadata to identify groups of genes correlated with environmental parameters. Stacked barplots represent the relative community composition across samples, and can be produced using raw reads or normalized read counts (e.g., TPM) associated with contigs and/or predicted proteins.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-09-867007-g001.tif"/>
</fig>
<p>There has been a concerted effort in the biological data science community to adhere to FAIR (findable, accessible, interoperable, reusable) principles in order to improve reproducibility (<xref ref-type="bibr" rid="B52">Garcia et&#xa0;al., 2020</xref>), and the oceanographic community is beginning to benefit from the adoption of these practices. In addition to fostering a culture of open data and enabling broader usage of data products, there is tremendous value in making computational code, pipelines, protocols and intermediate products available to new data scientists that are beginning their bioinformatic pursuits.</p>
<p>One avenue for this is sharing analysis and visualization code accompanying published studies on public servers, such as <italic>GitHub</italic> or personal websites, which is increasingly done by marine microbial ecologists. Code is most useful when annotated to facilitate readability, which is effectively done using rendered reports (Markdown) with <italic>RStudio</italic> and <italic>Jupyter Notebook</italic>. Tools such as <italic>Binder</italic> allow users to work in exact coding environments used to produce data, including loaded pre-requisites and input variables accessible through a website. Documentation in the form of personal blogs that accompany analyses are ideal tools for conveying underlying concepts and detailed thought processes going into analytical decisions, which are valuable educational resources for others in the microbial ecology field (e.g., <italic>polarmicrobes.org/antarctica-blog</italic>, <italic>merenlab.org/posts</italic>). Raw sequences are typically required to be uploaded to public repositories before publication, such as the National Center for Biotechnology Information (NCBI) Sequence Read Archive (SRA), and intermediate data files including assemblies, annotations, and read counts can similarly be shared on open-access repositories (e.g., Zenodo). In addition to these avenues for sharing computational resources, laboratory protocols can be archived on websites such as <italic>protocols.io</italic>, which brings new practitioners up to speed with technical logistics involved in sample acquisition and helps standardize sample processing.</p>
<p>Below we describe a typical metatranscriptomic bioinformatic analysis and provide an example workflow using second generation sequencing (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1</bold>
</xref> and <xref ref-type="supplementary-material" rid="SF1">
<bold>Supplementary Figure&#xa0;1</bold>
</xref>). We encourage new users to consult existing code, tutorials, and blog posts compiled by other data scientists to gain familiarity with these computational steps. Ideally, these new users will share code once their analysis is complete, and the oceanographic community as a whole will benefit from the incorporation of these open data science practices.</p>
<sec id="s3_1">
<title>Compute Environment</title>
<p>Once raw sequences are generated, a series of bioinformatic steps are performed to assemble reads into transcripts <italic>de novo</italic>, quantify gene expression, and assign taxonomic and functional annotations. These steps may be performed individually or as part of an automated workflow in a Linux-based environment, or within a GUI web-based platform (e.g., <italic>Galaxy</italic>). It is recommended to store all raw files in read-only format in more than one place. Many of the steps in metatranscriptomic analyses are computationally intensive and cannot be performed on the typical laptop or workstation. As such, access to a high performance computing cluster through an institution or national resource (e.g. XSEDE) or access to cloud based compute resources (e.g. Azure, Amazon Web Services) is often necessary. Broadly, the steps of assembly, quantification, and annotation require access to resources, with typical smaller scale projects benefiting from 25-40 cores and 250-400 Gb of RAM, and needs scaling with the size of the dataset and choice of tools.</p>
</sec>
<sec id="s3_2">
<title>Quality Control</title>
<p>Raw reads are trimmed to remove poor quality base pairs common on the ends of Illumina reads, and to clip off sequence adapters. Numerous tools are available for trimming sequences, including <italic>Trimmomatic</italic> (<xref ref-type="bibr" rid="B17">Bolger et&#xa0;al., 2014</xref>), <italic>FASTX-Toolkit</italic> (hannonlab.cshl.edu/fastx_toolkit), or <italic>cutadapt</italic> (<xref ref-type="bibr" rid="B100">Martin, 2011</xref>), with these tools universally compatible with Illumina sequences. The quality of sequences pre- and post-trimming can be evaluated using tools such as <italic>FastQC</italic> (<uri xlink:href="https://www.bioinformatics.babraham.ac.uk/projects/fastqc">www.bioinformatics.babraham.ac.uk/projects/fastqc</uri>), or evaluated in batch with <italic>MultiQC</italic> (github.com/ewels/MultiQC), which will additionally summarize total number of reads among other useful metrics. While often an aggressive approach to trimming has been taken, work in single species transcriptomes suggests that a less stringent trimming of only those reads whose Phred sequence quality score &lt;2 or &lt;5 is sufficient and optimal across a variety of downstream metrics (<xref ref-type="bibr" rid="B95">MacManes, 2014</xref>).</p>
</sec>
<sec id="s3_3">
<title>Removal of Contaminants and/or Spiked Sequences</title>
<p>Non-poly-A RNA or organelle mRNA may have been sequenced along with nuclear mRNA, especially if rRNA depletion was used as the library preparation. Ribosomal RNA is not included in most reference databases, and alignments of these sequences will be patchy and inconsistent. These sequences can be removed prior to the analysis by alignment against reference rRNA sequences using tools such as <italic>riboPicker</italic> (<uri xlink:href="https://ribopicker.sourceforge.net">ribopicker.sourceforge.net</uri>), <italic>SortMeRNA</italic> (<xref ref-type="bibr" rid="B77">Kopylova et&#xa0;al., 2012</xref>), or <italic>BBDuk</italic> within the BBTools suite (<uri xlink:href="https://jgi.doe.gov/data-and-tools/bbtools">jgi.doe.gov/data-and-tools/bbtools</uri>). In addition, if used, mRNA spike sequences will be useful for copies L<sup>-1</sup> quantification, but do not need to be included in the downstream analysis. Non-target sequences can be removed by aligning against a spike reference fasta file, for example with <italic>BBMap</italic> <uri xlink:href="https://sourceforge.net/projects/bbmap/">sourceforge.net/projects/bbmap/</uri>.</p>
</sec>
<sec id="s3_4">
<title>Assemblies</title>
<p>Taxonomic and functional interpretations of RNA-Seq data could theoretically be achieved by aligning reads to annotated eukaryotic genomes and metagenomes, however, we lack genomic representatives that cover the extreme diversity found in the natural environment, and <italic>de novo</italic> assemblies are commonly used instead (<xref ref-type="bibr" rid="B86">Lau et&#xa0;al., 2018</xref>). The <italic>de novo</italic> assembly process relies on elongating individual short reads into contiguous sequences (contigs) using overlapping sequences of length <italic>k</italic>, or k-mers (<xref ref-type="bibr" rid="B123">Robertson et&#xa0;al., 2010</xref>). Popular assemblers for eukaryotic transcriptomes include <italic>Trinity</italic> (<xref ref-type="bibr" rid="B57">Grabherr et&#xa0;al., 2011</xref>), <italic>Trans-ABySS</italic> (<xref ref-type="bibr" rid="B123">Robertson et&#xa0;al., 2010</xref>), <italic>rnaSPAdes</italic> (<xref ref-type="bibr" rid="B22">Bushmanova et&#xa0;al., 2019</xref>), <italic>IDBA-Tran</italic> (<xref ref-type="bibr" rid="B114">Peng et&#xa0;al., 2013</xref>), and <italic>MEGAHIT</italic> (<xref ref-type="bibr" rid="B90">Li et&#xa0;al., 2015</xref>), among others (<xref ref-type="bibr" rid="B108">Ortiz et&#xa0;al., 2021</xref>), which differ in their algorithmic basis, relative performance, and the number and length of contigs generated. Although these assemblers were designed for metagenomics (<italic>MEGAHIT</italic>) or transcriptomics (<italic>Trans-ABySS, Trinity, rnaSPAdes, IDBA-Tran</italic>), they are largely compatible with environmental metatranscriptomes (<xref ref-type="bibr" rid="B86">Lau et&#xa0;al., 2018</xref>) and eukaryotic sequences (<xref ref-type="bibr" rid="B108">Ortiz et&#xa0;al., 2021</xref>), with <italic>rnaSPAdes</italic> and <italic>Trinity</italic> performing particularly well for marine microeukaryotic communities in terms of the number of high quality and annotatable contigs produced (<xref ref-type="bibr" rid="B79">Krinos et&#xa0;al., 2022</xref>).</p>
<p>Quality-trimmed reads should be used as input during the assembly process, with some assemblers capable of handling multiple pairs of reads (co-assembling), depending on computational constraints. For large datasets, individual assemblies can be generated from each set of reads, which could then be merged together and de-replicated by clustering at high sequence similarity (95-100%) using tools such as <italic>cd-hit</italic> (<xref ref-type="bibr" rid="B89">Li and Godzik, 2006</xref>) or <italic>MMseqs2</italic> (<xref ref-type="bibr" rid="B145">Steinegger and S&#xf6;ding, 2017</xref>; <xref ref-type="bibr" rid="B79">Krinos et&#xa0;al., 2022</xref>). Broadly, assembly metrics (e.g. percent mapped reads) improve with a multi-assembler approach in which assembly output from different tools are combined (<xref ref-type="bibr" rid="B108">Ortiz et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B79">Krinos et&#xa0;al., 2022</xref>). In this case, the resulting assembly will contain contigs generated from all communities sampled and different assembler algorithms used. <italic>De novo</italic> assembling with metatranscriptomic reads from closely related taxa may inadvertently introduce spurious and/or chimeric contigs, in which reads from different transcripts are combined and would not reflect true protein pools. Certain transcriptomic assemblers are better at controlling chimeric contigs than others, with <italic>Trans-ABySS</italic> and <italic>IDBA-Tran</italic> stable across a range of k-mers (<xref ref-type="bibr" rid="B160">Wang and Gribskov, 2016</xref>).</p>
<p>Third generation sequencing reads can be assembled to produce high quality, long contigs using <italic>de novo</italic> assemblers such as <italic>metaFlye</italic>, which take into consideration challenges specific to long reads, such as uneven coverage among species sequenced (<xref ref-type="bibr" rid="B74">Kolmogorov et&#xa0;al., 2020</xref>). The informatic methodology will need to be reconsidered as third generation sequencing becomes more commonly applied and directly compared to older, short read-based studies. In particular, hybrid assemblies combining short and long reads benefit from the throughput/low error rates of short sequences and added structural information provided by long sequences (<xref ref-type="bibr" rid="B116">Prjibelski et&#xa0;al., 2020</xref>). This capability has been recently built into the <italic>MUFFIN</italic> metagenomic workflow (<xref ref-type="bibr" rid="B152">van Damme et&#xa0;al., 2021</xref>) and the <italic>rnaSPAdes</italic> assembler (<xref ref-type="bibr" rid="B116">Prjibelski et&#xa0;al., 2020</xref>), with the <italic>rnaSPAdes</italic> hybrid approach successfully applied to marine phytoplankton in culture (<xref ref-type="bibr" rid="B144">Sperfeld et&#xa0;al., 2021</xref>).</p>
</sec>
<sec id="s3_5">
<title>Read Mapping</title>
<p>Trimmed reads can be aligned to the de-replicated, final assembly to estimate gene expression across samples. Alternatively, reads may be aligned to assemblies generated from individual samples, although relative comparisons across samples could then only be made at the fold change or gene ratio level. When aiming to draw direct comparisons in community composition and gene expression across a dataset, it is simplest to align to the same reference assembly, so that reads are allowed to align to the closest possible contig match, rather than only those contigs assembled from an individual sample.</p>
<p>Read mapping can be performed using traditional alignment tools such as <italic>Bowtie2</italic> (<xref ref-type="bibr" rid="B84">Langmead and Salzberg, 2012</xref>) or <italic>BWA</italic> (<xref ref-type="bibr" rid="B88">Li and Durbin, 2009</xref>) which map short reads against a reference transcriptome or genome. Newer alignment options include <italic>Salmon</italic> (<xref ref-type="bibr" rid="B112">Patro et&#xa0;al., 2017</xref>) and <italic>Kallisto</italic> (<xref ref-type="bibr" rid="B18">Bray et&#xa0;al., 2016</xref>) which use quasi-mapping and pseudo-alignment approaches, respectively, rather than base-to-base alignments, performing rapid alignments while preserving high sensitivity and accuracy.</p>
<p>In addition to mapping reads to the <italic>de novo</italic> assembly, another option is to map metatranscriptomic reads to transcriptome and genome references directly, for example the MMETSP database. This method could identify community members present that closely match cultured species or strains of interest without the effort of <italic>de novo</italic> assembling, and can capture organisms that failed to assemble into high quality contigs (<xref ref-type="bibr" rid="B4">Alexander et&#xa0;al., 2015a</xref>; <xref ref-type="bibr" rid="B102">Metegnier et&#xa0;al., 2020</xref>; <xref ref-type="bibr" rid="B59">Harke et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B106">Muratore et&#xa0;al., 2022</xref>). However, is it important to note that current reference transcriptome databases are limited relative to the tremendous taxonomic diversity of eukaryotes in seawater (<xref ref-type="bibr" rid="B40">de Vargas et&#xa0;al., 2015</xref>), and this approach could therefore miss key taxa that are present.</p>
</sec>
<sec id="s3_6">
<title>Quantification of Transcripts</title>
<p>Transcript abundance can be estimated using mRNA standards, as developed for marine prokaryotes (<xref ref-type="bibr" rid="B131">Satinsky et&#xa0;al., 2013</xref>; <xref ref-type="bibr" rid="B53">Gifford et&#xa0;al., 2014</xref>; <xref ref-type="bibr" rid="B132">Satinsky et&#xa0;al., 2017</xref>). In order to determine how much standard to add prior to sample extraction, test filters can be collected and sacrificed from representative stations/depths with differing levels of biomass (chlorophyll <italic>a</italic> fluorescence). Conversely, standards can be added after RNA is extracted, although this &#x201c;quasi-standard&#x201d; would no longer take into account RNA loss during the extraction procedure, and would lead to an overestimate of mRNA abundance.</p>
<p>Transcript abundances can be normalized by the volume filtered to approximate copies L<sup>-1</sup>:</p>
<disp-formula>
<mml:math display="block" id="M1">
<mml:mrow>
<mml:mi>C</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>p</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>e</mml:mi>
<mml:msub>
<mml:mi>s</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#xa0;</mml:mo>
</mml:mrow>
</mml:msub>
<mml:msup>
<mml:mi>L</mml:mi>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msup>
<mml:mo>=</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:mi>r</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>d</mml:mi>
<mml:msub>
<mml:mi>s</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#xd7;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mo>&#xa0;</mml:mo>
<mml:mi>t</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>l</mml:mi>
<mml:mo>&#xa0;</mml:mo>
<mml:mi>r</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>d</mml:mi>
<mml:mi>s</mml:mi>
<mml:mo>&#xa0;</mml:mo>
<mml:mo>&#xd7;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>s</mml:mi>
<mml:mi>p</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>k</mml:mi>
<mml:mi>e</mml:mi>
<mml:mo>&#xa0;</mml:mo>
<mml:mi>c</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>p</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>s</mml:mi>
<mml:mi>p</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>k</mml:mi>
<mml:mi>e</mml:mi>
<mml:mo>&#xa0;</mml:mo>
<mml:mi>r</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>d</mml:mi>
<mml:mi>s</mml:mi>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>l</mml:mi>
<mml:mo>&#xa0;</mml:mo>
<mml:mi>r</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>d</mml:mi>
<mml:mi>s</mml:mi>
</mml:mrow>
</mml:mfrac>
<mml:mo>&#xa0;</mml:mo>
<mml:mo>&#xd7;</mml:mo>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mrow>
<mml:mi>v</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>l</mml:mi>
<mml:mi>u</mml:mi>
<mml:mi>m</mml:mi>
<mml:mi>e</mml:mi>
<mml:mo>&#xa0;</mml:mo>
<mml:mi>f</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>l</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>d</mml:mi>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<p>where <italic>reads<sub>i</sub>
</italic> are the raw read counts of transcript <italic>i</italic>, <italic>spike reads</italic> are the raw read counts associated with the mRNA spike standard, <italic>spike copies</italic> are the amount of mRNA copies (molecules) added to samples prior to sequencing, <italic>total reads</italic> are the number of mRNA reads in the sequence library (minus spike reads), and <italic>volume filtered</italic> is the amount of seawater filtered. Normalized counts may be used (e.g., TPM) in place of raw read counts in these absolute transcript calculations, which would account for transcript length bias (<xref ref-type="bibr" rid="B103">Mortazavi et&#xa0;al., 2008</xref>; <xref ref-type="bibr" rid="B11">Bartholom&#xe4;us et&#xa0;al., 2016</xref>).</p>
</sec>
<sec id="s3_7">
<title>Protein Predictions and Orthologous Group Clustering</title>
<p>Proteins are predicted from assembled contigs (transcripts) through open reading frame (ORF) prediction software, such as <italic>TransDecoder</italic> (transdecoder.github.io) or <italic>GeneMark S-T</italic> (<xref ref-type="bibr" rid="B149">Tang et&#xa0;al., 2015</xref>). If using the metatranscriptome as a reference for a metaproteomic peptide-spectrum-matching (PSM), the ORF predictions are the FASTA database used for PSM scoring (<xref ref-type="bibr" rid="B34">Cohen et&#xa0;al., 2021</xref>).</p>
</sec>
<sec id="s3_8">
<title>Annotations</title>
<sec id="s3_8_1">
<title>Taxonomic Assignments</title>
<p>Assigning taxonomic annotations to contigs allows for examinations into community composition across spatial and temporal gradients, or as a function of experimental perturbations. Taxonomic assignments are performed by aligning assembled contig sequences against a reference database. For identifying marine microeukaryotes in the field, it is key to use a database that includes transcriptomes or genomes from laboratory isolates or environmentally derived single-cell marine microeukaryotes. The MMETSP database includes 678 marine microeukaryote transcriptomes, including phylogenetically diverse and ecologically relevant taxa (<xref ref-type="bibr" rid="B70">Keeling et&#xa0;al., 2014</xref>; <xref ref-type="bibr" rid="B66">Johnson et&#xa0;al., 2019</xref>). Databases including MMETSP references such as EukProt (<xref ref-type="bibr" rid="B122">Richter et&#xa0;al., 2020</xref>), EukZoo (github.com/zxl124/EukZoo-database), and PhyloDB (allenlab.ucsd.edu/data) are valuable resources with additional transcriptomes and genomes present. Sequences may be aligned to these databases using tools such as <italic>BLAST</italic> (<xref ref-type="bibr" rid="B6">Altschul et&#xa0;al., 1990</xref>), <italic>DIAMOND</italic> (<xref ref-type="bibr" rid="B21">Buchfink et&#xa0;al., 2015</xref>), and <italic>MMseqs2</italic> (Steinegger et&#xa0;al., 2017), with quality thresholds commonly used to assess goodness of fit including E-value cutoffs (e.g., E&#xa0;&lt; 10<sup>-5</sup>), high sequence similarity percentage, and/or high bit score. <italic>EUKulele</italic> is a taxonomic annotation tool designed for marine microeukaryotes, and can perform <italic>BLAST</italic> or <italic>DIAMOND</italic> alignment searches against custom or default databases, including MMETSP (<xref ref-type="bibr" rid="B80">Krinos et&#xa0;al., 2021</xref>). For contigs with numerous hits exceeding a quality threshold, a Least Common Ancestor (LCA) approach is used to assign annotations at the lowest common taxonomic level. It is recommended to include marine bacteria, metazoa, and common contaminants in the databases for purposes of identifying these community members, if present, and avoiding misannotation. For example, the default <italic>EUKulele</italic> database includes the MarRef database of marine prokaryotic genomes (<xref ref-type="bibr" rid="B72">Klemetsen et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B80">Krinos et&#xa0;al., 2021</xref>). In addition, using databases containing reference transcriptomes that have been screened for multi-species presence and decontaminated are preferred (<xref ref-type="bibr" rid="B154">Van Vlierberghe et&#xa0;al., 2021</xref>).</p>
<p>It is crucial to remember, however, that we are ultimately limited in identifying taxonomy by what is available in our databases. If eukaryotic organisms captured in field studies are unrelated to cultured representatives included in taxonomic databases, with sufficiently low sequence similarity, they will be unannotated or misannotated. MMETSP has expanded sequence coverage of diatoms, prasinophytes, and dinoflagellates (<xref ref-type="bibr" rid="B70">Keeling et&#xa0;al., 2014</xref>), but a large number of ecologically relevant taxa remain missing from reference databases, especially those from the depths of the ocean where protistan diversity is quite high (<xref ref-type="bibr" rid="B134">Schoenle et&#xa0;al., 2021</xref>). Testing multiple databases containing different protistan reference organisms may be helpful during initial explorations of datasets. Generally, ~40-60% of marine metatranscriptomic contigs can be assigned a taxonomic annotation (e.g., <xref ref-type="bibr" rid="B33">Cohen et&#xa0;al., 2017</xref>; <xref ref-type="bibr" rid="B27">Carradec et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B63">Hu et&#xa0;al., 2018</xref>). The gene expression profiles captured with metatranscriptomics will represent a mixed community cellular state and the community&#x2019;s dominant response to the environment. Considering the vast taxonomic and metabolic diversity across microeukaryotic species, limited reference databases may not fully capture environmentally-relevant features. Moving forward, focused efforts on sequencing additional diverse organisms from rarer lineages and further populating reference databases will improve field identifications.</p>
</sec>
<sec id="s3_8_2">
<title>Functional Assignments</title>
<p>Functional annotation of transcripts enables investigations into ecophysiology, resource exchanges between organisms and the environment, and contributions to elemental cycling. Similar to taxonomic assignments, functions can be assigned <italic>via</italic> sequence homology searches to protein databases including eukaryotic references such as Kyoto Encyclopedia of Genes and Genomes (KEGG) (<xref ref-type="bibr" rid="B68">Kanehisa et&#xa0;al., 2016a</xref>), Eukaryotic Ortholog Groups (KOG) (<xref ref-type="bibr" rid="B150">Tatusov et&#xa0;al., 2003</xref>), and Gene Ontology (GO) (<xref ref-type="bibr" rid="B35">Gene Ontology Consortium, 2004</xref>) using likelihood thresholds (e.g., E&#xa0;&lt; 10<sup>-3</sup>). These databases have the advantage of grouping proteins by higher order function, allowing for broad classification into functional categories. In addition to these approaches, hidden Markov model (HMM) profiles searches executed <italic>via</italic> the <italic>HMMer</italic> software suite (<xref ref-type="bibr" rid="B48">Finn and Clements, 2011</xref>) in conjunction with protein databases [e.g., Pfam (<xref ref-type="bibr" rid="B47">Finn et&#xa0;al., 2014</xref>)] enable the identification of conserved protein domains, which can provide more remote information compared to local alignments. However, these conserved domains are not indicative of whole protein function and are not as easily classified into broader functional categories.</p>
<p>Certain existing tools and workflows perform combinations of the taxonomy and functional annotation steps listed above. For example, <italic>eggNOG-mapper</italic> provides KEGG, GO, Pfam, and other protein annotations as output using <italic>HMMer</italic>, <italic>DIAMOND</italic>, or <italic>MMSeqs2</italic> searches against the eggNOG database (<xref ref-type="bibr" rid="B24">Cantalapiedra et&#xa0;al., 2021</xref>). <italic>KOfamScan</italic> searches query sequences against the KEGG database using HMM profiles (github.com/takaram/kofam_scan). <italic>Trinotate</italic> is a workflow for non-model organisms that carries out assemblies with <italic>Trinity</italic> and annotates using eggNOG, GO, and Pfam, among other databases (<xref ref-type="bibr" rid="B20">Bryant et&#xa0;al., 2017</xref>). Web-based servers are also available (<italic>BlastKOALA, GhostKOALA, KofamKOALA</italic>) which annotate assembly fasta files against the KEGG database using sequence homology or HMM profile searches, in a web user interface (<xref ref-type="bibr" rid="B69">Kanehisa et&#xa0;al., 2016b</xref>). Users may choose an annotation procedure that aligns with their needs, level of automation desired, and preferred computational environment.</p>
</sec>
</sec>
<sec id="s3_9">
<title>Normalizations</title>
<p>Sequence libraries are commonly normalized to account for non-biological variability (e.g., large differences in total number of reads among samples, or library sizes) thereby allowing for relative comparisons across a dataset (<xref ref-type="bibr" rid="B1">Abrams et&#xa0;al., 2019</xref>). Popular RNA-Seq normalization and differential expression tools include <italic>EdgeR</italic> (<xref ref-type="bibr" rid="B125">Robinson and Oshlack, 2010</xref>; <xref ref-type="bibr" rid="B124">Robinson et&#xa0;al., 2010</xref>) and <italic>DESeq2</italic> (<xref ref-type="bibr" rid="B9">Anders &amp; Huber, 2010</xref>; <xref ref-type="bibr" rid="B94">Love et&#xa0;al., 2014</xref>), which correct for RNA composition bias during normalization, and estimate differential expression by fitting generalized linear models and assuming negative binomial distributions. False discovery rate (FDR) controlled p-values are used to account for multiple hypothesis testing within large gene expression datasets (<xref ref-type="bibr" rid="B121">Reiner et&#xa0;al., 2003</xref>). <italic>EdgeR</italic> and <italic>DESeq2</italic> are ideal for comparative analyses in which similar marine communities are subjected to treatments or conditions in order to address experimental hypotheses. These software tools offer dispersion shrinkage estimation and outlier detection to decrease the uncertainty of differential expression annotations (<xref ref-type="bibr" rid="B94">Love et&#xa0;al., 2014</xref>). It is important to note that applying differential expression tools for community-level metatranscriptomic data requires the organization of these data into taxon-specific bins for the purposes of scaling the count matrix, thereby isolating taxon-specific gene expression changes (<xref ref-type="bibr" rid="B73">Klingenberg and Meinicke, 2017</xref>).</p>
<p>These approaches make key assumptions about most genes not being differentially expressed, and care should be taken when comparing disparate marine ecosystems (e.g., surface and deep populations, or surface waters from eastern and western ocean basins). Normalization approaches that merely account for changes in sequence library and differences in contig length, such as Transcripts Per Million (TPM) (<xref ref-type="bibr" rid="B158">Wagner et&#xa0;al., 2012</xref>), may be better suited for large spatial or temporal field studies, although these methods cannot provide statistical estimates of differential expression and may retain transcript composition biases (<xref ref-type="bibr" rid="B31">Cockrum et&#xa0;al., 2020</xref>; see below: <italic>Consolidating assemblies</italic>). Flexible and adaptive statistical techniques that take into consideration zero-inflation, such as Tweedie models, may be useful for metatranscriptomic analyses and are worth exploring in marine omic datasets (<xref ref-type="bibr" rid="B96">Mallick et&#xa0;al., 2021</xref>).</p>
</sec>
<sec id="s3_10">
<title>Workflow Managers</title>
<p>As evident from the above descriptions of typical metatranscriptomic pipelines, many individual computational steps are required. Workflow managers are valuable for the batch execution of commands and processing steps across samples. Individual executions may otherwise be tedious, lead to inconsistencies and/or errors, and fail to be reproducible. Of the open-source workflow managers, <italic>Snakemake</italic> is a popular Python-based user-friendly option with rich documentation available (<xref ref-type="bibr" rid="B78">K&#xf6;ster and Rahmann, 2012</xref>). Many established <italic>Snakemake</italic>-based workflows are publicly available on code sharing repositories such as <italic>GitHub</italic>, and may be a useful starting point. For example, <italic>eukrhythmic</italic> is a scalable metatranscriptomic assembly workflow designed for marine microeukaryotes (<xref ref-type="bibr" rid="B79">Krinos et&#xa0;al., 2022</xref>), and many of the above outlined bioinformatic steps have been incorporated into <italic>eukrhythmic</italic> (github.com/AlexanderLabWHOI/eukrhythmic). In addition, the SqueezeMeta analysis pipeline is suitable for metatranscriptomic assembly and compatible with long read sequences (<xref ref-type="bibr" rid="B148">Tamames and Puente-S&#xe1;nchez, 2019</xref>).</p>
</sec>
</sec>
<sec id="s4">
<title>Consolidating Assemblies</title>
<p>It can be difficult to interpret large assemblies in which tens of millions of contigs are produced from mixed natural communities and most contigs do not correspond to a known protein function. There are several considerations for consolidating assemblies and streamlining the analysis, including orthologous group clustering and functional/taxonomic aggregation.</p>
<p>A subset of assembled metatranscriptomic contigs do not encode proteins due to being fragmented and/or chimeric, and this can be a function of RNA pool composition, sequencing depth, type of assemblers used, and protein prediction algorithms and parameters applied. It can therefore be helpful to remove non-coding sequences by predicting ORFs, and strictly using ORFs for read mapping and the quantitative analysis of taxonomic and functional groups. Orthologous groups (OGs) are commonly used to further collapse proteins into protein clusters derived from common ancestors, performed using tools such as <italic>OrthoFinder</italic> (<xref ref-type="bibr" rid="B46">Emms and Kelly, 2019</xref>), which uses a phylogenetic approach with multiple algorithms to identify relationships between genes and species. In contrast, <italic>OrthoMCL</italic> uses a reciprocal best hits approach with the Markov Clustering Algorithm (MCL) (<xref ref-type="bibr" rid="B153">van Dongen 2000</xref>; <xref ref-type="bibr" rid="B91">Li et&#xa0;al., 2003</xref>). These OGs can be used to track changes in function among closely related protistan taxa. However, one consideration for OG clustering is that it is highly dependent on clustering thresholds (e.g., percent sequence similarity), with stringent parameters limiting cross-species aggregation, and very lax parameters enabling cross-species clustering (<xref ref-type="bibr" rid="B79">Krinos et&#xa0;al., 2022</xref>). OG aggregation may be particularly valuable for collapsing read counts into evolutionarily related taxonomic groups and functional genes, effectively reducing the large assembly into more biologically meaningful groupings.</p>
<p>Aside from OG clustering, another popular approach for condensing assemblies has been to aggregate read counts to a common taxonomic and functional classification. For example, combining reads to the supergroup, class, or family level and KEGG Orthology ID. Read counts can either be collapsed (summed) into taxonomic and functional annotations before normalization, or summed following normalization. Transcript-estimating tools such as <italic>tximport</italic> can automate this step by converting read counts associated with transcripts (contigs) to gene level annotations and generating normalized reads as community-wide TPM (<xref ref-type="bibr" rid="B142">Soneson et&#xa0;al., 2015</xref>). An important consideration is the taxonomic level of interest in which to aggregate counts, and will differ depending on research focus. The primary disadvantage of working at a fine taxonomic resolution (e.g., species) is that fewer sequences can be confidently assigned to such a level, and users may be inundated by the overwhelming number of species to analyze. On the other hand, broad class level annotations (e.g., diatoms, dinoflagellates, haptophytes) are a composite of vastly different organisms, some of which may be responding to the environment in distinct ways (<xref ref-type="bibr" rid="B4">Alexander et&#xa0;al., 2015a</xref>; <xref ref-type="bibr" rid="B82">Lampe et&#xa0;al., 2018</xref>). Testing various taxonomic annotation levels can be helpful in determining the resolution most biologically meaningful for a given dataset. This approach relieves concern about mixing different species or genera into one group, as may occur with OG clustering, and provides taxon-specific counts. However, a key issue is that a significant fraction of coding sequences do not have a known protein function (low sequence similarity to references in databases), similar to observations with assembled genomes and metagenomes (<xref ref-type="bibr" rid="B155">Vanni et&#xa0;al., 2021</xref>). This approach therefore limits biological interpretations to only a fraction of the predicted proteins included in the downstream analysis.</p>
</sec>
<sec id="s5">
<title>Interrogation &amp; Visualization</title>
<p>When working with experimental treatments or pairwise comparative conditions, MA (log ratio-mean average) plots are a straightforward approach for visualization, highlighting highly abundant and variably expressed genes in specific taxa of interest (<xref ref-type="supplementary-material" rid="SF2">
<bold>Supplementary Figure&#xa0;2</bold>
</xref>). These are created by plotting log fold change by average normalized gene expression, and can be generated directly through <italic>EdgeR</italic> and <italic>DESeq2</italic> packages. In addition, MANTA plots are a useful way to depict the MA relationship with pie charts representing the relative breakdown of taxonomic composition for each functional annotation (see github.com/AlexanderLabWHOI/2022-metaT-m3-perspective for code). Fold change comparisons are ideal for visualizing the magnitude of change in expression across samples, which can be difficult to discern from normalized transcript abundance alone. Similarly, volcano plots highlight differentially expressed genes with statistical support by graphing fold change by FDR (<xref ref-type="supplementary-material" rid="SF2">
<bold>Supplementary Figure&#xa0;2</bold>
</xref>). Datasets from spatial and temporal studies may also be averaged across time or space zonations to visualize in MA plots, for example by averaging gene expression across all surface and deep communities. However, these broad groupings may conceal biologically relevant patterns across environmental features. In conjunction with these, exploratory approaches may be used to find structure across latitudes and depth, including ordinations, clustered heatmaps, and network analyses.</p>
<p>Ordinations are used to distill multidimensional data into two or three dimensions for visualization. Omic data is highly dimensional, with the number of annotated genes commonly reaching the thousands. Popular unconstrained ordination approaches include Principal Component Analysis (PCA) based on Euclidean distance, Principal Coordinate Analysis (PCoA) compatible with other forms of dissimilarity measurements, and Nonmetric Multidimensional Scaling (NMDS) which ranks distances in nonlinear space iteratively (<xref ref-type="bibr" rid="B119">Ramette, 2007</xref>). With these unconstrained ordinations, the relationship between metadata and ordination space can be assessed, for example using the <italic>envfit</italic> function of <italic>vegan</italic> (<xref ref-type="bibr" rid="B41">Dixon, 2003</xref>). Constrained ordinations such as Canonical Correlation Analysis (CCA) and Redundancy Analysis (RDA) can be used to evaluate how transcriptional profiles change across sample groups according to metadata, such as environmental measurements or categorical variables (<xref ref-type="bibr" rid="B119">Ramette, 2007</xref>). (See github.com/AlexanderLabWHOI/2022-metaT-m3-perspective for example CCA ordination tutorial). Broadly, these approaches can be used to find similarities in gene expression profiles across sample types and/or relate transcript levels to environmental conditions. Ordination plots have been utilized to show time-dependent patterns in microeukaryote gene expression (<xref ref-type="bibr" rid="B58">Groussman et&#xa0;al., 2021</xref>), taxon-specific microeukaryote functional profiles (<xref ref-type="bibr" rid="B63">Hu et&#xa0;al., 2018</xref>), and differences in surface and deep dinoflagellate metatranscriptome profiles (<xref ref-type="bibr" rid="B34">Cohen et&#xa0;al., 2021</xref>). The input data for ordinations may be normalized read counts associated with annotated or unannotated transcripts at the community level (e.g., community-wide TPM), or normalized at a given taxonomic level of interest (e.g., haptophytes).</p>
<p>Gene expression profiles can be effectively compared across samples using heatmaps, clustered using a statistical similarity metric and highlighting relationships among treatment groups, ocean regions, or temporal dimensions. Typically, columns represent individual samples, rows represent genes, and colors represent normalized read counts. These heatmaps can include all genes within the expression profile or subset to highlight specific genes of interest. Care should be taken when subsetting expression profiles to include differentially expressed genes, because in the absence of biostatistical tests, differential expression cannot be reliably determined. Transcripts with the highest variances can be calculated, but this will be biased towards highly expressed genes since variance increases with transcript abundance in a heteroscedastic manner (<xref ref-type="bibr" rid="B87">Law et&#xa0;al., 2014</xref>). It is therefore recommended to correct for the mean-variance relationship (as performed by <italic>EdgeR</italic> and <italic>DESeq2</italic>) or perform a transformation such as log normalization; however, log-normalizing prior to calculating variance can have the opposite effect and result in high variances of lowly expressed genes. Normalizations that effectively control for heteroscedasticity, such as the variance stabilizing transformation, are recommended to improve differential expression assessments (<xref ref-type="bibr" rid="B168">Zwiener et&#xa0;al., 2014</xref>).</p>
<p>Marine metatranscriptomic datasets can be quite large, consisting of billions of reads, millions of contigs, and thousands of annotated genes. Network analyses can be used to identify ecological connections between taxonomic groups, associations among functional processes, and/or link environmental metadata with expression patterns. This approach has been used to characterize the nutrient status of phytoplankton along an estuary gradient (<xref ref-type="bibr" rid="B56">Gong et&#xa0;al., 2018</xref>), identify diel metabolic patterns across protists (<xref ref-type="bibr" rid="B76">Kolody et&#xa0;al., 2019</xref>), and reveal co-occurrences between limiting resources and protistan taxa (<xref ref-type="bibr" rid="B25">Caputi et&#xa0;al., 2019</xref>). Ecological network analyses are frequently performed with Weighted Gene Correlation Network Analysis (<italic>WGCNA)</italic> (<xref ref-type="bibr" rid="B83">Langfelder and Horvath, 2008</xref>), <italic>igraph</italic> (<xref ref-type="bibr" rid="B36">Csardi and Nepusz, 2006</xref>), and <italic>sparCC</italic> (<xref ref-type="bibr" rid="B50">Friedman and Alm, 2012</xref>), with <italic>Cytoscape</italic> software commonly used for visualization of networks and interactions following creation (<xref ref-type="bibr" rid="B139">Shannon et&#xa0;al., 2003</xref>). Input data may be annotated transcripts with taxonomic and functional assignments and normalized read counts at the community level, and output is clusters or modules of closely related (co-occurring) associations defined by user-specified thresholds. These modules can be correlated with metadata to understand environmental conditions influencing taxonomic and/or metabolic processes. In particular, KEGG or GO-enrichments can be performed on modules to expand on how functional profiles are biologically, spatially or temporally organized.</p>
<p>Section plots, or 2D maps, are used to visualize changes in relative (normalized) or quantitative (copies L<sup>-1</sup>) gene expression across lateral and vertical expanses. This type of visualization is especially useful if high resolution sampling along transects was performed. Section plots can be generated using <italic>matplotlib</italic> library in Python (<xref ref-type="bibr" rid="B128">Saito et&#xa0;al., 2020</xref>), <italic>oce</italic> package in R (dankelley.github.io/oce), or software such as <italic>Ocean Data View</italic> (<xref ref-type="bibr" rid="B133">Schlitzer, 2018</xref>). This visualization method can highlight shifts in metabolic processes across depths, nutrient conditions, temperature regimes, or biomes (e.g., <xref ref-type="bibr" rid="B127">Saito et&#xa0;al., 2014</xref>; <xref ref-type="bibr" rid="B130">Santoro et&#xa0;al., 2017</xref>; <xref ref-type="bibr" rid="B61">Hogle et&#xa0;al., 2021</xref>). Highlighted genes may include those with strongly varying expression between zonations, or individual genes of interest hypothesized to be comparatively responsive to environmental conditions, such as biomarkers of nutrient stress (<xref ref-type="bibr" rid="B127">Saito et&#xa0;al., 2014</xref>). It is recommended to be cautious when interpreting weak and/or variable signals from genes that are not highly expressed, especially when biological replication is not available.</p>
</sec>
<sec id="s6">
<title>Tips For Getting Started</title>
<p>As discussed above, the learning curve associated with bioinformatics can be steep, and many resources exist to aid in the process. The Carpentries is an international organization that teaches foundational coding principles to learners of any background, with educational materials publicly available online (<xref ref-type="bibr" rid="B163">Wilson, 2006</xref>). Their lessons can equip users with basic knowledge of Unix, Python, and R, with more advanced concepts also available, including genomics, ecology and graphical visualizations (datacarpentry.org/lessons, software-carpentry.org/lessons). Additionally, universities with high performance computing clusters commonly have coding training sessions available to users. Specifically for microbiologists, the community initiative Bioinformatics Virtual Coordination Network (BVCN) aims to teach core coding and bioinformatic skills needed for omic analyses through publicly accessible lessons, tutorials, and video content available online (<xref ref-type="bibr" rid="B151">Tully et&#xa0;al., 2021</xref>). Lastly, it is key to learn how to effectively troubleshoot while coding, and user-based discussion boards are excellent venues for discovering how others have solved similar problems, asking questions, and sharing solutions. <italic>Biostars.org</italic>, <italic>Stackoverflow.com</italic>, and <italic>Github Issues</italic> have been invaluable community resources during our own bioinformatic development.</p>
</sec>
<sec id="s7">
<title>Future Directions</title>
<p>The guidelines and considerations presented here reflect the current methodology used to analyze microeukaryotic metatranscriptomes, but approaches will evolve as new tools, pipelines and databases come online. Users are encouraged to keep up with new versions of released databases and tools, and check documentation often to incorporate updates in computational steps (i.e., improved efficiency or accuracy, bug-fixes). In particular, focused community efforts on transcriptome sequencing of phylogenetically diverse protists will improve metatranscriptomic databases and strengthen our ability to track natural populations in the field. Single-cell transcriptomics (sc-RNA-Seq) performed on uncultured organisms isolated from the field will be especially valuable in expanding taxonomic and functional sequence coverage of microeukaryotes from complex communities (<xref ref-type="bibr" rid="B162">Wilms, 2021</xref>; <xref ref-type="bibr" rid="B75">Kolody et&#xa0;al., 2022</xref>).</p>
<p>Importantly, third generation sequencing technologies are promising avenues for microbial ecology that have rapidly developed over the past few years. Nanopore sequencing <italic>via</italic> the portable MinION and benchtop promethION platforms (Oxford Nanopore Technologies) and PacBio Single-Molecule Real-Time (SMRT) sequencing (Pacific Biosciences of California) will enable full length transcripts to be sequenced from mixed natural assemblages, without PCR amplification, short-read assemblies, and associated biases. Existing bioinformatic workflows will need to be updated to accommodate this new sequencing technology, as many publicly available workflows are currently designed for short read sequencing products obtained through Illumina technology. Increasingly, protocols are being developed for a combination of short and long read transcriptome sequencing of marine phytoplankton (<xref ref-type="bibr" rid="B144">Sperfeld et&#xa0;al., 2021</xref>).</p>
<p>The protocols outlined here have been compiled from individual studies, which are the result of years of experience at sea, in labs, and on the command line. As discussed above, there are multiple options for carrying out each step of the process, from seawater collection to bioinformatic handling. We currently lack an understanding of how the different, yet congruent, methods influence the downstream analyses and biological interpretations. A community intercalibration exercise in which multiple research groups analyze the same initial natural community using their various preferred sampling, laboratory and computational pipelines would advance our understanding of how methodology influences results, and would increase confidence in chosen practices. This is one of the goals recently discussed at the &#x201c;<italic>Ocean Nucleic Acids Omics Intercalibration and Standardization</italic>&#x201d; workshop funded by the National Science Foundation&#x2019;s Ocean Carbon &amp; Biogeochemistry (OCB) Program (<xref ref-type="bibr" rid="B14">Berube et&#xa0;al., 2022</xref>). The workshop report provides a roadmap for such activities, including intercalibration efforts for a variety of marine omics applications, with additional sampling and processing considerations not covered here (<xref ref-type="bibr" rid="B14">Berube et&#xa0;al., 2022</xref>). Such activities are critical for the development of future coordinated large oceanographic international programs, such as BioGeoSCAPES (<uri xlink:href="http://www.biogeoscapes.org">www.biogeoscapes.org</uri>).</p>
<p>Valuable insights have been provided by microeukaryote metatranscriptomic studies to date, and exciting discoveries certainly await us in the coming years as the approach continues to be applied to diverse ecosystems and integrated with complementary methods. A eukaryotic gene catalog consisting of over 116 million expressed genes has been recently generated from the ocean, expanding our understanding of protistan biogeography and physiology as a function of environmental conditions (<xref ref-type="bibr" rid="B27">Carradec et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B25">Caputi et&#xa0;al., 2019</xref>). Intriguingly, half of the gene functions are not annotated, and targeted efforts into protein characterization will drastically improve our understanding of protistan ecology and their biogeochemical roles (<xref ref-type="bibr" rid="B27">Carradec et&#xa0;al., 2018</xref>). There is furthermore value in combining marine metatranscriptomics with traditional physiological and chemical approaches (<xref ref-type="bibr" rid="B97">Marchetti, 2019</xref>; <xref ref-type="bibr" rid="B162">Wilms, 2021</xref>; <xref ref-type="bibr" rid="B75">Kolody et&#xa0;al., 2022</xref>), which can strengthen and guide biogeochemical interpretations, for example in relating metatranscriptomic community composition to microscope-derived cell counts or gene expression to empirically measured enzymatic rates. Integration of metatranscriptomic information with metaproteomics enables a broader view of protistan cell metabolism (<xref ref-type="bibr" rid="B34">Cohen et&#xa0;al., 2022</xref>), with recent modeling efforts offering a mechanistic understanding of the relationships between environmentally responsive transcripts and proteins in marine microbes (<xref ref-type="bibr" rid="B159">Walworth et&#xa0;al., 2022</xref>). Similar pairings with metabolomics and/or lipidomics hold promise for relating taxonomic groups and metabolic processes to released organics, revealing trophic interactions among community members and nutrient utilization patterns (<xref ref-type="bibr" rid="B43">Durham et&#xa0;al., 2015</xref>; <xref ref-type="bibr" rid="B60">Heal et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B106">Muratore et&#xa0;al., 2022</xref>). Continuing to integrate and apply metatranscriptomics to biogeochemically complex and understudied marine ecosystems will undoubtedly shed light on the diverse roles marine protists play across our ocean biomes.</p>
</sec>
<sec id="s8" sec-type="author-contributions">
<title>Author Contributions</title>
<p>NC, HA, and AK conceived of the review. SH and RL generated coding resources. NC wrote the first draft. All authors contributed to the intellectual content, writing, and revising of the manuscript. All authors approved the submitted version.</p>
</sec>
<sec id="s9" sec-type="funding-information">
<title>Funding</title>
<p>We acknowledge funding support from the University of Georgia Skidaway Institute of Oceanography (to NRC), National Science Foundation (NSF) (OCE-1948025 to HA), and Department of Energy Computational Science Graduate Fellowship (DE-SC0020347 to AIK). SKH participation was supported through NSF OCE-1947776.</p>
</sec>
<sec id="s10" sec-type="COI-statement">
<title>Conflict of Interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s11" sec-type="disclaimer">
<title>Publisher&#x2019;s Note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
</body>
<back>
<ack>
<title>Acknowledgments</title>
<p>We graciously thank Adrian Marchetti (UNC) for valuable feedback on the manuscript.</p>
</ack>
<sec id="s12" sec-type="supplementary-material">
<title>Supplementary Material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fmars.2022.867007/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fmars.2022.867007/full#supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="Image_1.tif" id="SF1" mimetype="image/tiff">
<label>Supplementary Figure&#xa0;1</label>
<caption>
<p>Example research questions and analysis recommendations. The standard bioinformatic workflow is used to produce the intermediate products (assembly, annotations, read mappings, etc.), but normalization and visualization strategies differ depending on research question. *Note that either non-normalized raw reads or community-wide TPM may be used for relative community composition visualization with stacked barplots, but normalized counts (taking into account differences in library sizes) is recommended for ordinations.</p>
</caption>
</supplementary-material>
<supplementary-material xlink:href="Image_2.tif" id="SF2" mimetype="image/tiff">
<label>Supplementary Figure&#xa0;2</label>
<caption>
<p>Example MA and volcano plots for visualizing differential expression. MA plot <bold>(A)</bold>: MA plot shows the mean fold change versus mean expression with both measures on a log<sub>2</sub> scale. Genes above the horizontal dashed line represent genes with increased expression in one treatment (numerator in the fold change calculation) and genes below represent increased expression in the other treatment (denominator in the fold change calculation). Additional modifications can aid in visualizing differentially expressed genes. For example, this plot shows genes that are not significantly differentially expressed as gray points while genes that are significantly differentially expressed are black points (P &lt; 0.05). Data points with extremely high fold change values are plotted as triangles rather than circles. In this example, those are genes with log<sub>2</sub> fold change values greater than 5 or less than -5. The size of the points is scaled by -log<sub>10</sub>(p-value) such that lower p-values are larger points. Although not shown here, genes of interest can be color-coded and/or labeled directly if desired. One simple and popular coloration is to show the significantly up- or down-regulated genes as two different colors, for example, red and blue respectively. MANTA plot <bold>(B)</bold>: This plot is a modification of the MA plot and was introduced by <xref ref-type="bibr" rid="B98">Marchetti et&#xa0;al., 2012</xref>. The original plotting function was released as part of the manta (Microbial Assemblage Normalized Transcript Analysis) package in Bioconductor; however, use of this package to generate plots restricts users to use MANTA objects and lacks features such as the ability to handle replicates. As a result, new plotting functions inspired by the original were re-written and are available on Github (github.com/AlexanderLabWHOI/2022-metaT-m3-perspective). Here, genes that are significantly differentially expressed are shown as pie charts rather than plain black circles to display that taxonomic breakdown of the genes. This example uses the same data as the MA plot example, but now, different diatom genera are shown. Depending on the user&#x2019;s analysis, different groups and/or taxonomic-levels can be used. The use of the triangles as shown in the MA plot was omitted for this plot, but extremely high log<sub>2</sub> fold change values are 5 or -5. Volcano plot <bold>(C)</bold>: Rather than highlighting the mean abundance of a gene as in the MA plot, the volcano plot emphasizes the statistical significance (p-value) of genes between two treatments. Here, genes to the right of the horizontal dashed line represent genes with increased expression in one treatment (numerator in the fold change calculation) and genes to the left represent increased expression in the other treatment (denominator in the fold change calculation). Only genes above the horizontal dashed line, -log<sub>10</sub>(0.05) representing &#x3b1; = 0.05, are shown in black while genes below it are shown in gray to distinguish between points that are significantly differentially expressed or not as in the MA plot. Data points with extremely low p-values and thus are high on the y-axis are plotted as triangles rather than circles. In this example, those are genes with P &lt; 0.00001. As with the MA plot, additional color coding may be performed and may be as simple as coloring all the genes in the left treatment blue and genes in the right treatment red. Genes of interest can also be color-coded and/or labeled directly if desired.</p>
</caption>
</supplementary-material>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Abrams</surname> <given-names>Z. B.</given-names>
</name>
<name>
<surname>Johnson</surname> <given-names>T. S.</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Payne</surname> <given-names>P. R. O.</given-names>
</name>
<name>
<surname>Coombes</surname> <given-names>K.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>A Protocol to Evaluate RNA Sequencing Normalization Methods</article-title>. <source>BMC Bioinf.</source> <volume>20</volume>, <fpage>679</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12859-019-3247-x</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Alberti</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Poulain</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Engelen</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Labadie</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Romac</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Ferrera</surname> <given-names>I.</given-names>
</name>
<etal/>
</person-group>. (<year>2017</year>). <article-title>Viral to Metazoan Marine Plankton Nucleotide Sequences From the Tara Oceans Expedition</article-title>. <source>Sci. Data</source> <volume>4</volume>, <fpage>170093</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/sdata.2017.93</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Alexander</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Hu</surname> <given-names>S. K.</given-names>
</name>
<name>
<surname>Krinos</surname> <given-names>A. I.</given-names>
</name>
<name>
<surname>Pachiadaki</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Tully</surname> <given-names>B. J.</given-names>
</name>
<name>
<surname>Neely</surname> <given-names>C. J.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Eukaryotic Genomes From a Global Metagenomic Dataset Illuminate Trophic Modes and Biogeography of Ocean Plankton</article-title>. <source>bioRxiv</source> doi:&#xa0;<pub-id pub-id-type="doi">10.1101/2021.07.25.453713</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Alexander</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Jenkins</surname> <given-names>B. D.</given-names>
</name>
<name>
<surname>Rynearson</surname> <given-names>T. A.</given-names>
</name>
<name>
<surname>Dyhrman</surname> <given-names>S. T.</given-names>
</name>
</person-group> (<year>2015</year>a). <article-title>Metatranscriptome Analyses Indicate Resource Partitioning Between Diatoms in the Field</article-title>. <source>Proc. Natl. Acad. Sci.</source> <volume>112</volume>, <fpage>E2182</fpage>&#x2013;<lpage>E2190</lpage>. doi: <pub-id pub-id-type="doi">10.1073/pnas.1421993112</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Alexander</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Rouco</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Haley</surname> <given-names>S. T.</given-names>
</name>
<name>
<surname>Wilson</surname> <given-names>S. T.</given-names>
</name>
<name>
<surname>Karl</surname> <given-names>D. M.</given-names>
</name>
<name>
<surname>Dyhrman</surname> <given-names>S. T.</given-names>
</name>
</person-group> (<year>2015</year>b). <article-title>Functional Group-Specific Traits Drive Phytoplankton Dynamics in the Oligotrophic Ocean</article-title>. <source>Proc. Natl. Acad. Sci.</source> <volume>112</volume>, <fpage>E5972</fpage>&#x2013;<lpage>E5979</lpage>. doi: <pub-id pub-id-type="doi">10.1073/pnas.1518165112</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Altschul</surname> <given-names>S. F.</given-names>
</name>
<name>
<surname>Gish</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Miller</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Myers</surname> <given-names>E. W.</given-names>
</name>
<name>
<surname>Lipman</surname> <given-names>D. J.</given-names>
</name>
</person-group> (<year>1990</year>). <article-title>Basic Local Alignment Search Tool</article-title>. <source>J. Mol. Biol.</source> <volume>215</volume>, <fpage>403</fpage>&#x2013;<lpage>410</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/S0022-2836(05)80360-2</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Alvarez</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Schrey</surname> <given-names>A. W.</given-names>
</name>
<name>
<surname>Richards</surname> <given-names>C. L.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Ten Years of Transcriptomics in Wild Populations: What Have We Learned About Their Ecology and Evolution</article-title>? <source>Mol. Ecol</source>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/mec.13055</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ambardar</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Gupta</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Trakroo</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Lal</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Vakhlu</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>High Throughput Sequencing: An Overview of Sequencing Chemistry</article-title>. <source>Indian J. Microbiol.</source> <volume>56</volume>, <fpage>394</fpage>&#x2013;<lpage>404</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s12088-016-0606-4</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Anders</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Huber</surname> <given-names>W.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Differential Expression Analysis for Sequence Count Data</article-title>. <source>Genome Biol.</source> <volume>11</volume>, <fpage>R106</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/gb-2010-11-10-r106</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Baker</surname> <given-names>B. J.</given-names>
</name>
<name>
<surname>Sheik</surname> <given-names>C. S.</given-names>
</name>
<name>
<surname>Taylor</surname> <given-names>C. A.</given-names>
</name>
<name>
<surname>Jain</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Bhasi</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Cavalcoli</surname> <given-names>J. D.</given-names>
</name>
<etal/>
</person-group>. (<year>2013</year>). <article-title>Community Transcriptomic Assembly Reveals Microbes That Contribute to Deep-Sea Carbon and Nitrogen Cycling</article-title>. <source>ISME J</source> <volume>7</volume>, <page-range>1962&#x2013;73</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/ismej.2013.85</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bartholom&#xe4;us</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Fedyunin</surname> <given-names>I.</given-names>
</name>
<name>
<surname>Feist</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Sin</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Valleriani</surname> <given-names>A.</given-names>
</name>
<etal/>
</person-group>. (<year>2016</year>). <article-title>Bacteria Differently Regulate mRNA Abundance to Specifically Respond to Various Stresses</article-title>. <source>Phil. Trans. R. Soc. A</source> <volume>374</volume>: <elocation-id>20150069</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1098/rsta.2015.0069</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Becker</surname> <given-names>K. W.</given-names>
</name>
<name>
<surname>Harke</surname> <given-names>M. J.</given-names>
</name>
<name>
<surname>Mende</surname> <given-names>D. R.</given-names>
</name>
<name>
<surname>Muratore</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Weitz</surname> <given-names>J. S.</given-names>
</name>
<name>
<surname>DeLong</surname> <given-names>E. F.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Combined Pigment and Metatranscriptomic Analysis Reveals Highly Synchronized Diel Patterns of Phenotypic Light Response Across Domains in the Open Oligotrophic Ocean</article-title>. <source>ISME J.</source> <volume>15</volume>, <fpage>520</fpage>&#x2013;<lpage>533</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41396-020-00793-x</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bertrand</surname> <given-names>E. M.</given-names>
</name>
<name>
<surname>McCrow</surname> <given-names>J. P.</given-names>
</name>
<name>
<surname>Moustafa</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Zheng</surname> <given-names>H.</given-names>
</name>
<name>
<surname>McQuaid</surname> <given-names>J. B.</given-names>
</name>
<name>
<surname>Delmont</surname> <given-names>T. O.</given-names>
</name>
<etal/>
</person-group>. (<year>2015</year>). <article-title>Phytoplankton-Bacterial Interactions Mediate Micronutrient Colimitation at the Coastal Antarctic Sea Ice Edge</article-title>. <source>Proc. Natl. Acad. Sci. USA</source> <volume>112</volume>, <fpage>9938</fpage>&#x2013;<lpage>9943</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.1501615112</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Berube</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Gifford</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Hurwitz</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Jenkins</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Marchetti</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Santoto</surname> <given-names>A.</given-names>
</name>
</person-group> (<year>2022</year>). <source>Roadmap Towards Communitywide Intercalibration and Standardization of Ocean Nucleic Acids &#x2018;Omics Measurements</source>. doi:&#xa0;<pub-id pub-id-type="doi">10.1575/1912/28054</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Biller</surname> <given-names>S. J.</given-names>
</name>
<name>
<surname>Berube</surname> <given-names>P. M.</given-names>
</name>
<name>
<surname>Dooley</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Williams</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Satinsky</surname> <given-names>B. M.</given-names>
</name>
<name>
<surname>Hackl</surname> <given-names>T.</given-names>
</name>
<etal/>
</person-group>. (<year>2018</year>). <article-title>Marine Microbial Metagenomes Sampled Across Space and Time</article-title>. <source>Sci. Data</source> <volume>5</volume>, <fpage>180176</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/sdata.2018.176</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Blaxter</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Mieszkowska</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Di Palma</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Holland</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Durbin</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Richards</surname> <given-names>T.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>Sequence Locally, Think Globally: The Darwin Tree of Life Project</article-title>. <source>Proc. Natl. Acad. Sci.</source> <volume>119</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.2115642118</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bolger</surname> <given-names>A. M.</given-names>
</name>
<name>
<surname>Lohse</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Usadel</surname> <given-names>B.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Trimmomatic: A Flexible Trimmer for Illumina Sequence Data</article-title>. <source>Bioinformatics</source> <volume>30</volume>, <fpage>2114</fpage>&#x2013;<lpage>2120</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/btu170</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bray</surname> <given-names>N. L.</given-names>
</name>
<name>
<surname>Pimentel</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Melsted</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Pachter</surname> <given-names>L.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Near-Optimal Probabilistic RNA-Seq Quantification</article-title>. <source>Nat. Biotechnol.</source> <volume>34</volume>, <fpage>525</fpage>&#x2013;<lpage>527</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nbt.3519</pub-id>
</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Breier</surname> <given-names>J. A.</given-names>
</name>
<name>
<surname>Jakuba</surname> <given-names>M. V.</given-names>
</name>
<name>
<surname>Saito</surname> <given-names>M. A.</given-names>
</name>
<name>
<surname>Dick</surname> <given-names>G. J.</given-names>
</name>
<name>
<surname>Grim</surname> <given-names>S. L.</given-names>
</name>
<name>
<surname>Chan</surname> <given-names>E. W.</given-names>
</name>
<etal/>
</person-group>. (<year>2020</year>). <article-title>Revealing Ocean-Scale Biochemical Structure With a Deep-Diving Vertical Profiling Autonomous Vehicle</article-title>. <source>Sci. Robot.</source> <volume>5</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.1126/scirobotics.abc7104</pub-id>
</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bryant</surname> <given-names>D. M.</given-names>
</name>
<name>
<surname>Johnson</surname> <given-names>K.</given-names>
</name>
<name>
<surname>DiTommaso</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Tickle</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Couger</surname> <given-names>M. B.</given-names>
</name>
<name>
<surname>Payzin-Dogru</surname> <given-names>D.</given-names>
</name>
<etal/>
</person-group>. (<year>2017</year>). <article-title>A Tissue-Mapped Axolotl <italic>De Novo</italic> Transcriptome Enables Identification of Limb Regeneration Factors</article-title>. <source>Cell Rep</source> <volume>18</volume>(<issue>3</issue>):<page-range>762&#x2013;76</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.celrep.2016.12.063</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Buchfink</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Xie</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Huson</surname> <given-names>D. H.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Fast and Sensitive Protein Alignment Using DIAMOND</article-title>. <source>Nat. Methods</source> <volume>12</volume>, <fpage>59</fpage>&#x2013;<lpage>60</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nmeth.3176</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bushmanova</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Antipov</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Lapidus</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Prjibelski</surname> <given-names>A. D.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Rnaspades: A <italic>De Novo</italic> Transcriptome Assembler and Its Application to RNA-Seq Data</article-title>. <source>Gigascience</source> <volume>8</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/gigascience/giz100</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bush</surname> <given-names>S. J.</given-names>
</name>
<name>
<surname>McCulloch</surname> <given-names>M. E. B.</given-names>
</name>
<name>
<surname>Summers</surname> <given-names>K. M.</given-names>
</name>
<name>
<surname>Hume</surname> <given-names>D. A.</given-names>
</name>
<name>
<surname>Clark</surname> <given-names>E. L.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Integration of Quantitated Expression Estimates From polyA-Selected and rRNA-Depleted RNA-Seq Libraries</article-title>. <source>BMC Bioinf.</source> <volume>18</volume>, <fpage>301</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12859-017-1714-9</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cantalapiedra</surname> <given-names>C. P.</given-names>
</name>
<name>
<surname>Hern&#xe1;ndez-Plaza</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Letunic</surname> <given-names>I.</given-names>
</name>
<name>
<surname>Huerta-Cepas</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>2021</year>a). <article-title>eggNOG-Mapper V2: Functional Annotation, Orthology Assignments, and Domain Prediction at the Metagenomic Scale</article-title>. <source>Mol. Biol. Evol.</source> doi: <pub-id pub-id-type="doi">10.1093/molbev/msab293</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Caputi</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Carradec</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Eveillard</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Kirilovsky</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Pelletier</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Pierella Karlusich</surname> <given-names>J. J</given-names>
</name>
<etal/>
</person-group>. (<year>2019</year>). <article-title>Community-Level Responses to Iron Availability in Open Ocean Planktonic Ecosystems</article-title>. <source>Global Biogeochem. Cycle</source> <volume>33</volume>(<issue>3</issue>) <fpage>391</fpage>&#x2013;<lpage>419</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1029/2018GB006022</pub-id>
</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Caron</surname> <given-names>D. A.</given-names>
</name>
<name>
<surname>Alexander</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Allen</surname> <given-names>A. E.</given-names>
</name>
<name>
<surname>Archibald</surname> <given-names>J. M.</given-names>
</name>
<name>
<surname>Armbrust</surname> <given-names>E. V.</given-names>
</name>
<name>
<surname>Bachy</surname> <given-names>C.</given-names>
</name>
<etal/>
</person-group>. (<year>2017</year>). <article-title>Probing the Evolution, Ecology and Physiology of Marine Protists Using Transcriptomics</article-title>. <source>Nat. Rev. Microbiol</source> <volume>15</volume>, <fpage>6</fpage>&#x2013;<lpage>20</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nrmicro.2016.160</pub-id>
</citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Carradec</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Pelletier</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Da Silva</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Alberti</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Seeleuthner</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Blanc-Mathieu</surname> <given-names>R.</given-names>
</name>
<etal/>
</person-group>. (<year>2018</year>). <article-title>A Global Ocean Atlas of Eukaryotic Genes</article-title>. <source>Nat. Commun.</source> <volume>9</volume>, <fpage>373</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41467-017-02342-1</pub-id>
</citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cerdan-Garcia</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Baylay</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Polyviou</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Woodward</surname> <given-names>E. M. S.</given-names>
</name>
<name>
<surname>Wrightson</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Mahaffey</surname> <given-names>C.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Transcriptional Responses of Trichodesmium to Natural Inverse Gradients of Fe and P Availability</article-title>. <source>ISME J</source> <volume>16</volume>, <page-range>1055&#x2013;64</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41396-021-01151-1</pub-id>
</citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Kwan</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Tang</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Watt</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>Y.</given-names>
</name>
<etal/>
</person-group>. (<year>2020</year>). <article-title>Paired rRNA-Depleted and polyA-Selected RNA Sequencing Data and Supporting Multi-Omics Data From Human T Cells</article-title>. <source>Sci. Data</source> <volume>7</volume>, <fpage>376</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41597-020-00719-4</pub-id>
</citation>
</ref>
<ref id="B30">
<citation citation-type="book">
<person-group person-group-type="editor">
<name>
<surname>Clementson</surname> <given-names>L. A.</given-names>
</name>
<name>
<surname>Eriksen</surname> <given-names>R. S.</given-names>
</name>
</person-group> (Eds.). &#x201c;<article-title>Kolody, B. C., Harke, M. J., Hook, S. E., and Allen, A. E</article-title>
<article-title>). &#x201c;Chapter 13 - Transcriptomic and Metatranscriptomic Approaches in Phytoplankton: Insights and Advances,&#x201d;</article-title>,&#x201d; in <source>A. B. T.-A. @ in P. E. Willis</source> (<publisher-name>Elsevier</publisher-name>), <fpage>435</fpage>&#x2013;<lpage>485</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/B978-0-12-822861-6.00022-4</pub-id>
</citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cockrum</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Kaneshiro</surname> <given-names>K. R.</given-names>
</name>
<name>
<surname>Rechtsteiner</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Tabuchi</surname> <given-names>T. M.</given-names>
</name>
<name>
<surname>Strome</surname> <given-names>S.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>A Primer for Generating and Using Transcriptome Data and Gene Sets</article-title>. <source>Dev</source> <volume>147</volume>(<issue>24</issue>):<elocation-id>dev193854</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1242/dev.193854</pub-id>
</citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Coesel</surname> <given-names>S. N.</given-names>
</name>
<name>
<surname>Durham</surname> <given-names>B. P.</given-names>
</name>
<name>
<surname>Groussman</surname> <given-names>R. D.</given-names>
</name>
<name>
<surname>Hu</surname> <given-names>S. K.</given-names>
</name>
<name>
<surname>Caron</surname> <given-names>D. A.</given-names>
</name>
<name>
<surname>Morales</surname> <given-names>R. L.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Diel Transcriptional Oscillations of Light-Sensitive Regulatory Elements in Open-Ocean Eukaryotic Plankton Communities</article-title>. <source>Proc. Natl. Acad. Sci.</source> <volume>118</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.2011038118</pub-id>
</citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cohen</surname> <given-names>N. R.</given-names>
</name>
<name>
<surname>Ellis</surname> <given-names>K. A.</given-names>
</name>
<name>
<surname>Lampe</surname> <given-names>R. H.</given-names>
</name>
<name>
<surname>McNair</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Twining</surname> <given-names>B. S.</given-names>
</name>
<name>
<surname>Maldonado</surname> <given-names>M. T.</given-names>
</name>
<etal/>
</person-group>. (<year>2017</year>). <article-title>Diatom Transcriptional and Physiological Responses to Changes in Iron Bioavailability Across Ocean Provinces</article-title>. <source>Front. Mar. Sci.</source> <volume>4</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fmars.2017.00360</pub-id>
</citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cohen</surname> <given-names>N. R.</given-names>
</name>
<name>
<surname>McIlvin</surname> <given-names>M. R.</given-names>
</name>
<name>
<surname>Moran</surname> <given-names>D. M.</given-names>
</name>
<name>
<surname>Held</surname> <given-names>N. A.</given-names>
</name>
<name>
<surname>Saunders</surname> <given-names>J. K.</given-names>
</name>
<name>
<surname>Hawco</surname> <given-names>N. J.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Dinoflagellates Alter Their Carbon and Nutrient Metabolic Strategies Across Environmental Gradients in the Central Pacific Ocean</article-title>. <source>Nat. Microbiol.</source> <volume>6</volume>, <fpage>173</fpage>&#x2013;<lpage>186</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41564-020-00814-7</pub-id>
</citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Consortium</surname> <given-names>G. O.</given-names>
</name>
</person-group> (<year>2004</year>). <article-title>The Gene Ontology (GO) Database and Informatics Resource</article-title>. <source>Nucleic Acids Res.</source> <volume>32</volume>, <fpage>D258</fpage>&#x2013;<lpage>D261</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/gkh036</pub-id>
</citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Csardi</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Nepusz</surname> <given-names>T.</given-names>
</name>
</person-group> (<year>2006</year>). <article-title>The Igraph Software Package for Complex Network Research</article-title>. <source>InterJournal Complex Syst</source>.</citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cui</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Lin</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Ding</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Xin</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Gong</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>L.</given-names>
</name>
<etal/>
</person-group>. (<year>2010</year>). <article-title>A Comparison Between Ribo-Minus RNA-Sequencing and polyA-Selected RNA-Sequencing</article-title>. <source>Genomics</source> <volume>96</volume>, <fpage>259</fpage>&#x2013;<lpage>265</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.ygeno.2010.07.010</pub-id>
</citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Delmont</surname> <given-names>T. O.</given-names>
</name>
<name>
<surname>Gaia</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Hinsinger</surname> <given-names>D. D.</given-names>
</name>
<name>
<surname>Fr&#xe9;mont</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Vanni</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Fernandez-Guerra</surname> <given-names>A.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>Functional Repertoire Convergence of Distantly Related Eukaryotic Plankton Lineages Abundant in the Sunlit Ocean</article-title>. <source>Cell Genomics</source>, <volume>2</volume>:<fpage>100123</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.xgen.2022.100123</pub-id>
</citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Derelle</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Ferraz</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Rombauts</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Rouz&#xe9;</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Worden</surname> <given-names>A. Z.</given-names>
</name>
<name>
<surname>Robbens</surname> <given-names>S.</given-names>
</name>
<etal/>
</person-group>. (<year>2006</year>). <article-title>Genome Analysis of the Smallest Free-Living Eukaryote Ostreococcus Tauri Unveils Many Unique Features</article-title>. <source>Proc. Natl. Acad. Sci. USA</source> <volume>103</volume>, <fpage>11647</fpage>&#x2013;<lpage>11652</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.0604795103</pub-id>
</citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>de Vargas</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Audic</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Henry</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Decelle</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Mah&#xe9;</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Logares</surname> <given-names>R.</given-names>
</name>
<etal/>
</person-group>. (<year>2015</year>). <article-title>Eukaryotic Plankton Diversity in the Sunlit Ocean</article-title>. <source>Science</source> <volume>348</volume>, <fpage>6237</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1126/science.1261605</pub-id>
</citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dixon</surname> <given-names>P.</given-names>
</name>
</person-group> (<year>2003</year>). <article-title>VEGAN, a Package of R Functions for Community Ecology</article-title>. <source>J.&#xa0;Veg. Sci.</source> <volume>14</volume>, <fpage>927</fpage>&#x2013;<lpage>930</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/j.1654-1103.2003.tb02228.x</pub-id>
</citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dupont</surname> <given-names>C. L.</given-names>
</name>
<name>
<surname>Mccrow</surname> <given-names>J. P.</given-names>
</name>
<name>
<surname>Valas</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Moustafa</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Walworth</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Goodenough</surname> <given-names>U.</given-names>
</name>
<etal/>
</person-group>. (<year>2015</year>). <article-title>Genomes and Gene Expression Across Light and Productivity Gradients in Eastern Subtropical Pacific Microbial Communities</article-title>. <source>ISME J.</source> <volume>9</volume>, <fpage>1076</fpage>&#x2013;<lpage>1092</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/ismej.2014.198</pub-id>
</citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Durham</surname> <given-names>B. P.</given-names>
</name>
<name>
<surname>Sharma</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Luo</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Smith</surname> <given-names>C. B.</given-names>
</name>
<name>
<surname>Amin</surname> <given-names>S. A.</given-names>
</name>
<name>
<surname>Bender</surname> <given-names>S. J.</given-names>
</name>
<etal/>
</person-group>. (<year>2015</year>). <article-title>Cryptic Carbon and Sulfur Cycling Between Surface Ocean Plankton</article-title>. <source>Proc. Natl. Acad. Sci.</source> <volume>112</volume>, <fpage>453</fpage>&#x2013;<lpage>457</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.1413137112</pub-id>
</citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Edgcomb</surname> <given-names>V. P.</given-names>
</name>
<name>
<surname>Taylor</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Pachiadaki</surname> <given-names>M. G.</given-names>
</name>
<name>
<surname>Honjo</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Engstrom</surname> <given-names>I.</given-names>
</name>
<name>
<surname>Yakimov</surname> <given-names>M.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Comparison of Niskin vs. <italic>In Situ</italic> Approaches for Analysis of Gene Expression in Deep Mediterranean Sea Water Samples</article-title>. <source>Deep. Res. Part II. Top. Stud. Oceanogr</source> <volume>129</volume>, <page-range>213&#x2013;22</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.dsr2.2014.10.020</pub-id>
</citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ellis</surname> <given-names>K. A.</given-names>
</name>
<name>
<surname>Cohen</surname> <given-names>N. R.</given-names>
</name>
<name>
<surname>Moreno</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Marchetti</surname> <given-names>A.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Cobalamin-independent Methionine Synthase Distribution and Influence on Vitamin B12 Growth Requirements in Marine Diatoms</article-title>. <source>Protist</source> <volume>168</volume>, <fpage>32</fpage>&#x2013;<lpage>47</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.protis.2016.10.007</pub-id>.</citation>
</ref>
<ref id="B46">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Emms</surname> <given-names>D. M.</given-names>
</name>
<name>
<surname>Kelly</surname> <given-names>S.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>OrthoFinder: Phylogenetic Orthology Inference for Comparative Genomics</article-title>. <source>Genome Biol.</source> <volume>20</volume>, <fpage>238</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s13059-019-1832-y</pub-id>
</citation>
</ref>
<ref id="B47">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Finn</surname> <given-names>R. D.</given-names>
</name>
<name>
<surname>Bateman</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Clements</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Coggill</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Eberhardt</surname> <given-names>R. Y.</given-names>
</name>
<name>
<surname>Eddy</surname> <given-names>S. R.</given-names>
</name>
<etal/>
</person-group>. (<year>2014</year>). <article-title>Pfam: The Protein Families Database</article-title>. <source>Nucleic Acids Res.</source> <volume>42</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/gkt1223</pub-id>
</citation>
</ref>
<ref id="B48">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Finn</surname> <given-names>R. D.</given-names>
</name>
<name>
<surname>Clements</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>And Eddy, s</article-title>
<article-title>HMMER Web Server: Interactive Sequence Similarity Searching</article-title>. <source>R. Nucleic Acids Res.</source> <volume>39</volume>, <fpage>W29</fpage>&#x2013;<lpage>W37</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/gkr367</pub-id>
</citation>
</ref>
<ref id="B49">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Frias-Lopez</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Shi</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Tyson</surname> <given-names>G. W.</given-names>
</name>
<name>
<surname>Coleman</surname> <given-names>M. L.</given-names>
</name>
<name>
<surname>Schuster</surname> <given-names>S. C.</given-names>
</name>
<name>
<surname>Chisholm</surname> <given-names>S. W</given-names>
</name>
<etal/>
</person-group>. (<year>2008</year>). <article-title>Microbial Community Gene Expression in Ocean Surface Waters</article-title>. <source>Proc. Natl. Acad. Sci. USA</source> <volume>105</volume>(<issue>10</issue>), <page-range>3805&#x2013;10</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.0708897105</pub-id>
</citation>
</ref>
<ref id="B50">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Friedman</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Alm</surname> <given-names>E. J.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Inferring Correlation Networks From Genomic Survey Data</article-title>. <source>PloS Comput. Biol.</source> <volume>8</volume>, <elocation-id>e1002687</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1371/journal.pcbi.1002687</pub-id>
</citation>
</ref>
<ref id="B51">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gallego Romero</surname> <given-names>I.</given-names>
</name>
<name>
<surname>Pai</surname> <given-names>A. A.</given-names>
</name>
<name>
<surname>Tung</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Gilad</surname> <given-names>Y.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>RNA-Seq: Impact of RNA Degradation on Transcript Quantification</article-title>. <source>BMC Biol.</source> <volume>12</volume>, <fpage>42</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/1741-7007-12-42</pub-id>
</citation>
</ref>
<ref id="B52">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Garcia</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Batut</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Burke</surname> <given-names>M. L.</given-names>
</name>
<name>
<surname>Kuzak</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Psomopoulos</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Arcila</surname> <given-names>R.</given-names>
</name>
<etal/>
</person-group>. (<year>2020</year>). <article-title>Ten Simple Rules for Making Training Materials FAIR</article-title>. <source>PloS Comput. Biol.</source> <volume>16</volume>, <elocation-id>e1007854</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1371/journal.pcbi.1007854</pub-id>
</citation>
</ref>
<ref id="B53">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gifford</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Satinsky</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Moran</surname> <given-names>M. A.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Quantitative Microbial Metatranscriptomics</article-title>. <source>Methods Mol. Biol</source> <volume>1096</volume>:<page-range>213&#x2013;29</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/978-1-62703-712-9_17</pub-id>
</citation>
</ref>
<ref id="B54">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gilbert</surname> <given-names>J. A.</given-names>
</name>
<name>
<surname>Field</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Edwards</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Gilna</surname> <given-names>P.</given-names>
</name>
<etal/>
</person-group>. (<year>2008</year>). <article-title>Detection of Large Numbers of Novel Sequences in the Metatranscriptomes of Complex Marine Microbial Communities</article-title>. <source>PloS One</source>  <volume>3</volume>(<issue>8</issue>):<elocation-id>e3042</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1371/journal.pone.0003042</pub-id>
</citation>
</ref>
<ref id="B55">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gong</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Browne</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Hall</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Schruth</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Paerl</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Marchetti</surname> <given-names>A</given-names>
</name>
</person-group> (<year>2017</year>) Molecular Insights Into a Dinoflagellate Bloom. <source>ISME J</source> <volume>11</volume>, <page-range>439&#x2013;52</page-range>. doi: <pub-id pub-id-type="doi">10.1038/ismej.2016.129</pub-id>
</citation>
</ref>
<ref id="B56">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gong</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Paerl</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Marchetti</surname> <given-names>A.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Eukaryotic Phytoplankton Community Spatiotemporal Dynamics as Identified Through Gene Expression Within a Eutrophic Estuary</article-title>. <source>Environ. Microbiol</source> <volume>20</volume>(<issue>3</issue>), <page-range>1095&#x2013;111</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/1462-2920.14049</pub-id>
</citation>
</ref>
<ref id="B57">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Grabherr</surname> <given-names>M. G.</given-names>
</name>
<name>
<surname>Haas</surname> <given-names>B. J.</given-names>
</name>
<name>
<surname>Yassour</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Levin</surname> <given-names>J. Z.</given-names>
</name>
<name>
<surname>Thompson</surname> <given-names>D. A.</given-names>
</name>
<name>
<surname>Amit</surname> <given-names>I.</given-names>
</name>
<etal/>
</person-group>. (<year>2011</year>). <article-title>Full-Length Transcriptome Assembly From RNA-Seq Data Without a Reference Genome</article-title>. <source>Nat. Biotech.</source> <volume>29</volume>, <fpage>644</fpage>&#x2013;<lpage>652</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nbt.1883</pub-id>
</citation>
</ref>
<ref id="B58">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Groussman</surname> <given-names>R. D.</given-names>
</name>
<name>
<surname>Coesel</surname> <given-names>S. N.</given-names>
</name>
<name>
<surname>Durham</surname> <given-names>B. P.</given-names>
</name>
<name>
<surname>Armbrust</surname> <given-names>E. V.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Diel-Regulated Transcriptional Cascades of Microbial Eukaryotes in the North Pacific Subtropical Gyre</article-title>. <source>Front. Microbiol.</source> <volume>12</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fmicb.2021.682651</pub-id>
</citation>
</ref>
<ref id="B59">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Harke</surname> <given-names>M. J.</given-names>
</name>
<name>
<surname>Frischkorn</surname> <given-names>K. R.</given-names>
</name>
<name>
<surname>Hennon</surname> <given-names>G. M. M.</given-names>
</name>
<name>
<surname>Haley</surname> <given-names>S. T.</given-names>
</name>
<name>
<surname>Barone</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Karl</surname> <given-names>D. M.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Microbial Community Transcriptional Patterns Vary in Response to Mesoscale Forcing in the North Pacific Subtropical Gyre</article-title>. <source>Environ. Microbiol.</source> <volume>23</volume> (<issue>8</issue>), <fpage>4807</fpage>&#x2013;<lpage>4822</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/1462-2920.15677</pub-id>
</citation>
</ref>
<ref id="B60">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Heal</surname> <given-names>K. R.</given-names>
</name>
<name>
<surname>Durham</surname> <given-names>B. P.</given-names>
</name>
<name>
<surname>Boysen</surname> <given-names>A. K.</given-names>
</name>
<name>
<surname>Carlson</surname> <given-names>L. T.</given-names>
</name>
<name>
<surname>Qin</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Ribalet</surname> <given-names>F.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Marine Community Metabolomes Carry Fingerprints of Phytoplankton Community Composition</article-title>. <source>mSystems</source> <volume>6</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.1128/mSystems.01334-20</pub-id>
</citation>
</ref>
<ref id="B61">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hogle</surname> <given-names>S. L.</given-names>
</name>
<name>
<surname>Hackl</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Bundy</surname> <given-names>R. M.</given-names>
</name>
<name>
<surname>Park</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Braakman</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Satinsky</surname> <given-names>B.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>Siderophores as an Iron Source for Prochlorococcus in Deep Chlorophyll Maximum Layers of the Oligotrophic Ocean</article-title>. <source>ISME J</source>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41396-022-01215-w</pub-id>
</citation>
</ref>
<ref id="B62">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hu</surname> <given-names>S. K.</given-names>
</name>
<name>
<surname>Herrera</surname> <given-names>E. L.</given-names>
</name>
<name>
<surname>Smith</surname> <given-names>A. R.</given-names>
</name>
<name>
<surname>Pachiadaki</surname> <given-names>M. G.</given-names>
</name>
<name>
<surname>Edgcomb</surname> <given-names>V. P.</given-names>
</name>
<name>
<surname>Sylva</surname> <given-names>S. P.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Protistan Grazing Impacts Microbial Communities and Carbon Cycling at Deep-Sea Hydrothermal Vents</article-title>. <source>Proc. Natl. Acad. Sci. U.S.A.</source> <volume>118</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.2102674118</pub-id>
</citation>
</ref>
<ref id="B63">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hu</surname> <given-names>S. K.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Alexander</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Campbell</surname> <given-names>V.</given-names>
</name>
<name>
<surname>Connell</surname> <given-names>P. E.</given-names>
</name>
<name>
<surname>Dyhrman</surname> <given-names>S. T.</given-names>
</name>
<etal/>
</person-group>. (<year>2018</year>). <article-title>Shifting Metabolic Priorities Among Key Protistan Taxa Within and Below the Euphotic Zone</article-title>. <source>Environ. Microbiol.</source> <volume>20</volume>, <fpage>2865</fpage>&#x2013;<lpage>2879</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/1462-2920.14259</pub-id>
</citation>
</ref>
<ref id="B64">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hussing</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Kampmann</surname> <given-names>M.-L.</given-names>
</name>
<name>
<surname>Mogensen</surname> <given-names>H. S.</given-names>
</name>
<name>
<surname>B&#xf8;rsting</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Morling</surname> <given-names>N.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Quantification of Massively Parallel Sequencing Libraries &#x2013; A&#xa0;Comparative Study of Eight Methods</article-title>. <source>Sci. Rep.</source> <volume>8</volume>, <fpage>1110</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41598-018-19574-w</pub-id>
</citation>
</ref>
<ref id="B65">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ji</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Lin</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Yu</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Luo</surname> <given-names>H.</given-names>
</name>
<etal/>
</person-group>. (<year>2018</year>). <article-title>Metatranscriptome Analysis Reveals Environmental and Diel Regulation of a Heterosigma Akashiwo (Raphidophyceae) Bloom</article-title>. <source>Environ. Microbiol</source> <volume>20</volume> (<issue>3</issue>), <page-range>1078&#x2013;94</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/1462-2920.14045</pub-id>
</citation>
</ref>
<ref id="B66">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Johnson</surname> <given-names>L. K.</given-names>
</name>
<name>
<surname>Alexander</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Brown</surname> <given-names>C. T.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Re-Assembly, Quality Evaluation, and Annotation of 678 Microbial Eukaryotic Reference Transcriptomes</article-title>. <source>Gigascience</source> <volume>8</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/gigascience/giy158</pub-id>
</citation>
</ref>
<ref id="B67">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jones</surname> <given-names>L. J.</given-names>
</name>
<name>
<surname>Yue</surname> <given-names>S. T.</given-names>
</name>
<name>
<surname>Cheung</surname> <given-names>C. Y.</given-names>
</name>
<name>
<surname>Singer</surname> <given-names>V. L.</given-names>
</name>
</person-group> (<year>1998</year>). <article-title>RNA Quantitation by Fluorescence-Based Solution Assay: RiboGreen Reagent Characterization</article-title>. <source>Anal. Biochem</source> <volume>265</volume>(<issue>2</issue>), <page-range>368&#x2013;74</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1006/abio.1998.2914</pub-id>
</citation>
</ref>
<ref id="B68">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kanehisa</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Sato</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Kawashima</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Furumichi</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Tanabe</surname> <given-names>M.</given-names>
</name>
</person-group> (<year>2016</year>a). <article-title>KEGG as a Reference Resource for Gene and Protein Annotation</article-title>. <source>Nucleic Acids Res.</source> <volume>44</volume>, <fpage>D457</fpage>&#x2013;<lpage>D462</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/gkv1070</pub-id>
</citation>
</ref>
<ref id="B69">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kanehisa</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Sato</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Morishima</surname> <given-names>K.</given-names>
</name>
</person-group> (<year>2016</year>b). <article-title>BlastKOALA and GhostKOALA: KEGG Tools for Functional Characterization of Genome and Metagenome Sequences</article-title>. <source>J. Mol. Biol.</source> <volume>428</volume>, <fpage>726</fpage>&#x2013;<lpage>731</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.jmb.2015.11.006</pub-id>
</citation>
</ref>
<ref id="B70">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Keeling</surname> <given-names>P. J.</given-names>
</name>
<name>
<surname>Burki</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Wilcox</surname> <given-names>H. M.</given-names>
</name>
<name>
<surname>Allam</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Allen</surname> <given-names>E. E.</given-names>
</name>
<name>
<surname>Amaral-Zettler</surname> <given-names>L. A.</given-names>
</name>
<etal/>
</person-group>. (<year>2014</year>). <article-title>The Marine Microbial Eukaryote Transcriptome Sequencing Project (MMETSP): Illuminating the Functional Diversity of Eukaryotic Life in the Oceans Through Transcriptome Sequencing</article-title>. <source>PloS Biol.</source> <volume>12</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.1371/journal.pbio.1001889</pub-id>
</citation>
</ref>
<ref id="B71">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kerkhof</surname> <given-names>L. J.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Is Oxford Nanopore Sequencing Ready for Analyzing Complex Microbiomes</article-title>? <source>FEMS Microbiol. Ecol.</source> <volume>97</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/femsec/fiab001</pub-id>
</citation>
</ref>
<ref id="B72">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Klemetsen</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Raknes</surname> <given-names>I. A.</given-names>
</name>
<name>
<surname>Fu</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Agafonov</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Balasundaram</surname> <given-names>S. V.</given-names>
</name>
<name>
<surname>Tartari</surname> <given-names>G.</given-names>
</name>
<etal/>
</person-group>. (<year>2018</year>). <article-title>The MAR Databases: Development and Implementation of Databases Specific for Marine Metagenomics</article-title>. <source>Nucleic Acids Res.</source> <volume>46</volume>, <fpage>D692</fpage>&#x2013;<lpage>D699</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/gkx1036</pub-id>
</citation>
</ref>
<ref id="B73">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Klingenberg</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Meinicke</surname> <given-names>P.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>How To Normalize Metatranscriptomic Count Data For Differential Expression Analysis</article-title>. <source>PeerJ</source> <volume>5</volume>:<elocation-id>e3859</elocation-id>. doi: <pub-id pub-id-type="doi">10.7717/peerj.3859</pub-id>
</citation>
</ref>
<ref id="B74">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kolmogorov</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Bickhart</surname> <given-names>D. M.</given-names>
</name>
<name>
<surname>Behsaz</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Gurevich</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Rayko</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Shin</surname> <given-names>S. B.</given-names>
</name>
<etal/>
</person-group>. (<year>2020</year>). <article-title>Metaflye: Scalable Long-Read Metagenome Assembly Using Repeat Graphs</article-title>. <source>Nat. Methods</source> <volume>17</volume>, <page-range>1103&#x2013;10</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41592-020-00971-x</pub-id>
</citation>
</ref>
<ref id="B75">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kolody</surname> <given-names>B. C.</given-names>
</name>
<name>
<surname>Harke</surname> <given-names>M. J.</given-names>
</name>
<name>
<surname>Hook</surname> <given-names>S. E.</given-names>
</name>
<name>
<surname>Allen</surname> <given-names>A. E.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>&#x201c;Chapter 13 - Transcriptomic and Metatranscriptomic Approaches in Phytoplankton: Insights and Advances,&#x201d;</article-title> in, <person-group person-group-type="editor">
<name>
<surname>Clementson</surname> <given-names>L. A.</given-names>
</name>
<name>
<surname>Eriksen</surname> <given-names>R. S.</given-names>
</name>
</person-group>eds. A. B. T.-A. in P. E. Willis (<publisher-name>Elsevier</publisher-name>) <volume>4</volume>, <fpage>435</fpage>&#x2013;<lpage>485</lpage>.  doi: <pub-id pub-id-type="doi">10.1016/B978-0-12-822861-6.00022-4</pub-id>.</citation>
</ref>
<ref id="B76">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kolody</surname> <given-names>B. C.</given-names>
</name>
<name>
<surname>McCrow</surname> <given-names>J. P.</given-names>
</name>
<name>
<surname>Allen</surname> <given-names>L. Z.</given-names>
</name>
<name>
<surname>Aylward</surname> <given-names>F. O.</given-names>
</name>
<name>
<surname>Fontanez</surname> <given-names>K. M.</given-names>
</name>
<name>
<surname>Moustafa</surname> <given-names>A.</given-names>
</name>
<etal/>
</person-group>. (<year>2019</year>). <article-title>Diel Transcriptional Response of a California Current Plankton Microbiome to Light, Low Iron, and Enduring Viral Infection</article-title>. <source>ISME J</source> <volume>13</volume>, <page-range>2817&#x2013;33</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41396-019-0472-2</pub-id>
</citation>
</ref>
<ref id="B77">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kopylova</surname> <given-names>E.</given-names>
</name>
<name>
<surname>No&#xe9;</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Touzet</surname> <given-names>H.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>SortMeRNA: Fast and Accurate Filtering of Ribosomal RNAs in Metatranscriptomic Data</article-title>. <source>Bioinformatics</source> <volume>28</volume>, <issue>24</issue>, <page-range>3211&#x2013;7</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/bts611</pub-id>
</citation>
</ref>
<ref id="B78">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>K&#xf6;ster</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Rahmann</surname> <given-names>S.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Snakemake&#x2013;A Scalable Bioinformatics Workflow Engine</article-title>. <source>Bioinformatics</source> <volume>28</volume>, <fpage>2520</fpage>&#x2013;<lpage>2522</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/bts480</pub-id>
</citation>
</ref>
<ref id="B79">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Krinos</surname> <given-names>A. I.</given-names>
</name>
<name>
<surname>Cohen</surname> <given-names>N. R.</given-names>
</name>
<name>
<surname>Follows</surname> <given-names>M. J.</given-names>
</name>
<name>
<surname>Alexander</surname> <given-names>H.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Reverse Engineering Environmental Metatranscriptomes Clarifies Best Practices for Eukaryotic Assembly</article-title>. <source>bioRxiv</source>. doi:&#xa0;<pub-id pub-id-type="doi">10.1101/2022.04.25.489326</pub-id>
</citation>
</ref>
<ref id="B80">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Krinos</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Hu</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Cohen</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Alexander</surname> <given-names>H.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>EUKulele: Taxonomic Annotation of the Unsung Eukaryotic Microbes</article-title>. <source>J. Open Source Software</source> <volume>6</volume>, <elocation-id>2817</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.21105/joss.02817</pub-id>
</citation>
</ref>
<ref id="B81">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lambert</surname> <given-names>B. S.</given-names>
</name>
<name>
<surname>Groussman</surname> <given-names>R. D.</given-names>
</name>
<name>
<surname>Schatz</surname> <given-names>M. J.</given-names>
</name>
<name>
<surname>Coesel</surname> <given-names>S. N.</given-names>
</name>
<name>
<surname>Durham</surname> <given-names>B. P.</given-names>
</name>
<name>
<surname>Alverson</surname> <given-names>A. J.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>The Dynamic Trophic Architecture of Open-Ocean Protist Communities Revealed Through Machine-Guided Metatranscriptomics</article-title>. <source>Proc. Nat. Acad. Sci. U.S.A.</source> <volume>119</volume>(<issue>7</issue>), <elocation-id>e2100916119</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.2100916119</pub-id>
</citation>
</ref>
<ref id="B82">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lampe</surname> <given-names>R. H.</given-names>
</name>
<name>
<surname>Mann</surname> <given-names>E. L.</given-names>
</name>
<name>
<surname>Cohen</surname> <given-names>N. R.</given-names>
</name>
<name>
<surname>Till</surname> <given-names>C. P.</given-names>
</name>
<name>
<surname>Thamatrakoln</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Brzezinski</surname> <given-names>M. A.</given-names>
</name>
<etal/>
</person-group>. (<year>2018</year>). <article-title>Different Iron Storage Strategies Among Bloom-Forming Diatoms</article-title>. <source>Proc. Natl. Acad. Sci. U.S.A.</source> <volume>115</volume>, <fpage>E12275</fpage>&#x2013;<lpage>E12284</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.1805243115</pub-id>
</citation>
</ref>
<ref id="B83">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Langfelder</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Horvath</surname> <given-names>S.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>WGCNA: An R Package for Weighted Correlation Network Analysis</article-title>. <source>BMC Bioinf.</source> <volume>9</volume>, <elocation-id>559</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/1471-2105-9-559</pub-id>
</citation>
</ref>
<ref id="B84">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Langmead</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Salzberg</surname> <given-names>S. L.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Fast Gapped-Read Alignment With Bowtie 2</article-title>. <source>Nat. Methods</source> <volume>9</volume>, <fpage>357</fpage>&#x2013;<lpage>359</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nmeth.1923</pub-id>
</citation>
</ref>
<ref id="B85">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lanz&#xe9;n</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Simachew</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Gessesse</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Chmolowska</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Jonassen</surname> <given-names>I.</given-names>
</name>
<name>
<surname>&#xd8;vre&#xe5;s</surname> <given-names>L.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Surprising Prokaryotic and Eukaryotic Diversity, Community Structure and Biogeography of Ethiopian Soda Lakes</article-title>. <source>PloS One</source> <volume>8</volume>(<issue>8</issue>) <elocation-id>e72577</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1371/journal.pone.0072577</pub-id>
</citation>
</ref>
<ref id="B86">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lau</surname> <given-names>M. C. Y.</given-names>
</name>
<name>
<surname>Harris</surname> <given-names>R. L.</given-names>
</name>
<name>
<surname>Oh</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Yi</surname> <given-names>M. J.</given-names>
</name>
<name>
<surname>Behmard</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Onstott</surname> <given-names>T. C.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Taxonomic and Functional Compositions Impacted by the Quality of Metatranscriptomic Assemblies</article-title>. <source>Front. Microbiol.</source> <volume>9</volume>, <elocation-id>1235</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fmicb.2018.01235</pub-id>
</citation>
</ref>
<ref id="B87">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Law</surname> <given-names>C. W.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Shi</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Smyth</surname> <given-names>G. K.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Voom: Precision Weights Unlock Linear Model Analysis Tools for RNA-Seq Read Counts</article-title>. <source>Genome Biol.</source> <volume>15</volume>, <fpage>R29</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/gb-2014-15-2-r29</pub-id>
</citation>
</ref>
<ref id="B88">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Durbin</surname> <given-names>R.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Fast and Accurate Short Read Alignment With Burrows&#x2013;Wheeler Transform</article-title>. <source>Bioinformatics</source> <volume>25</volume>, <fpage>1754</fpage>&#x2013;<lpage>1760</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/btp324</pub-id>
</citation>
</ref>
<ref id="B89">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Godzik</surname> <given-names>A.</given-names>
</name>
</person-group> (<year>2006</year>). <article-title>Cd-Hit: A Fast Program for Clustering and Comparing Large Sets of Protein or Nucleotide Sequences</article-title>. <source>Bioinformatics</source> <volume>22</volume>, <fpage>1658</fpage>&#x2013;<lpage>1659</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/btl158</pub-id>
</citation>
</ref>
<ref id="B90">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>C.-M.</given-names>
</name>
<name>
<surname>Luo</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Sadakane</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Lam</surname> <given-names>T.-W.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>MEGAHIT: An Ultra-Fast Single-Node Solution for Large and Complex Metagenomics Assembly <italic>via</italic> Succinct De Bruijn Graph</article-title>. <source>Bioinformatics</source> <volume>31</volume>, <fpage>1674</fpage>&#x2013;<lpage>1676</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/btv033</pub-id>
</citation>
</ref>
<ref id="B91">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Stoeckert</surname> <given-names>C. J.</given-names>
<suffix>Jr.</suffix>
</name>
<name>
<surname>Roos</surname> <given-names>D. S.</given-names>
</name>
</person-group> (<year>2003</year>). <article-title>OrthoMCL: Identification of Ortholog Groups for Eukaryotic Genomes</article-title>. <source>Genome Res.</source> <volume>13</volume>, <fpage>2178</fpage>&#x2013;<lpage>2189</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1101/gr.1224503</pub-id>
</citation>
</ref>
<ref id="B92">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Hu</surname> <given-names>N.</given-names>
</name>
<name>
<surname>He</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Pong</surname> <given-names>R.</given-names>
</name>
<etal/>
</person-group>. (<year>2012</year>). <article-title>Comparison of Next-Generation Sequencing Systems</article-title>. <source>J. Biomed. Biotechnol.</source> <volume>2012</volume>, <elocation-id>251364</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1155/2012/251364</pub-id>
</citation>
</ref>
<ref id="B93">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lo Giudice Cappelli</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Austin</surname> <given-names>W. E. N.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Size Matters: Analyses of Benthic Foraminiferal Assemblages Across Differing Size Fractions</article-title>. <source>Front. Mar. Sci.</source> <volume>6</volume>, <elocation-id>752</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fmars.2019.00752</pub-id>
</citation>
</ref>
<ref id="B94">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Love</surname> <given-names>M. I.</given-names>
</name>
<name>
<surname>Huber</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Anders</surname> <given-names>S.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Moderated Estimation of Fold Change and Dispersion for RNA-Seq Data With Deseq2</article-title>. <source>Genome Biol.</source> <volume>15</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s13059-014-0550-8</pub-id>
</citation>
</ref>
<ref id="B95">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>MacManes</surname> <given-names>M. D.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>On the Optimal Trimming of High-Throughput mRNA Sequence Data</article-title>. <source>Front. Genet</source> <volume>5</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fgene.2014.00013</pub-id>
</citation>
</ref>
<ref id="B96">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mallick</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Chatterjee</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Chowdhury</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Chatterjee</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Rahnavard</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Hicks</surname> <given-names>S. C.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Differential Expression of Single-Cell RNA-Seq Data Using Tweedie Models</article-title>. <source>bioRxiv</source>. doi:&#xa0;<pub-id pub-id-type="doi">10.1101/2021.03.28.437378</pub-id>
</citation>
</ref>
<ref id="B97">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Marchetti</surname> <given-names>A.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>A Global Perspective on Iron and Plankton Through the Tara Oceans Lens</article-title>. <source>Global Biogeochem. Cycle</source> <volume>33</volume>, <page-range>239&#x2013;42</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1029/2019GB006181</pub-id>
</citation>
</ref>
<ref id="B98">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Marchetti</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Schruth</surname> <given-names>D. M.</given-names>
</name>
<name>
<surname>Durkin</surname> <given-names>C. A.</given-names>
</name>
<name>
<surname>Parker</surname> <given-names>M. S.</given-names>
</name>
<name>
<surname>Kodner</surname> <given-names>R. B.</given-names>
</name>
<name>
<surname>Berthiaume</surname> <given-names>C. T.</given-names>
</name>
<etal/>
</person-group>. (<year>2012</year>). <article-title>Comparative Metatranscriptomics Identifies Molecular Bases for the Physiological Responses of Phytoplankton to Varying Iron Availability</article-title>. <source>Proc. Natl. Acad. Sci.</source> <volume>109</volume>(<issue>6</issue>), <fpage>E317</fpage>&#x2013;<lpage>E325</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.1118408109</pub-id>
</citation>
</ref>
<ref id="B99">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Marguerat</surname> <given-names>S.</given-names>
</name>
<name>
<surname>B&#xe4;hler</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Coordinating Genome Expression With Cell Size</article-title>. <source>Trends Genet.</source> <volume>28</volume> (<issue>11</issue>), <fpage>560</fpage>&#x2013;<lpage>565</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.tig.2012.07.003</pub-id>
</citation>
</ref>
<ref id="B100">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Martin</surname> <given-names>M.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Cutadapt Removes Adapter Sequences From High-Throughput Sequencing Reads</article-title>. <source>EMBnet.journal</source>. doi:&#xa0;<pub-id pub-id-type="doi">10.14806/ej.17.1.200</pub-id>
</citation>
</ref>
<ref id="B101">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>McCarren</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Becker</surname> <given-names>J. W.</given-names>
</name>
<name>
<surname>Repeta</surname> <given-names>D. J.</given-names>
</name>
<name>
<surname>Shi</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Young</surname> <given-names>C. R.</given-names>
</name>
<name>
<surname>Malmstrom</surname> <given-names>R. R.</given-names>
</name>
<etal/>
</person-group>. (<year>2010</year>). <article-title>Microbial Community Transcriptomes Reveal Microbes and Metabolic Pathways Associated With Dissolved Organic Matter Turnover in the Sea</article-title>. <source>Proc. Natl. Acad. Sci.</source> <volume>107</volume>, <fpage>16420</fpage>&#x2013;<lpage>16427</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.1010732107</pub-id>
</citation>
</ref>
<ref id="B102">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Metegnier</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Paulino</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Ramond</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Siano</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Sourisseau</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Destombe</surname> <given-names>C.</given-names>
</name>
<etal/>
</person-group>. (<year>2020</year>). <article-title>Species Specific Gene Expression Dynamics During Harmful Algal Blooms</article-title>. <source>Sci. Rep.</source> <volume>10</volume>, <fpage>6182</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41598-020-63326-8</pub-id>
</citation>
</ref>
<ref id="B103">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mortazavi</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Williams</surname> <given-names>B. A.</given-names>
</name>
<name>
<surname>McCue</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Schaeffer</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Wold</surname> <given-names>B.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>Mapping and Quantifying Mammalian Transcriptomes by RNA-Seq</article-title>. <source>Nat. Methods</source> <volume>5</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nmeth.1226</pub-id>
</citation>
</ref>
<ref id="B104">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Muir</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Lou</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Spakowicz</surname> <given-names>D. J.</given-names>
</name>
<name>
<surname>Salichos</surname> <given-names>L.</given-names>
</name>
<etal/>
</person-group>. (<year>2016</year>). <article-title>The Real Cost of Sequencing: Scaling Computation to Keep Pace With Data Generation</article-title>. <source>Genome Biol.</source> <volume>17</volume>, <fpage>53</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s13059-016-0917-0</pub-id>
</citation>
</ref>
<ref id="B105">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mukherjee</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Reddy</surname> <given-names>M. S.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Metatranscriptomics: An Approach for Retrieving Novel Eukaryotic Genes From Polluted and Related Environments</article-title>. <source>3. Biotech.</source> <volume>10</volume>, <fpage>71</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s13205-020-2057-1</pub-id>
</citation>
</ref>
<ref id="B106">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Muratore</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Boysen</surname> <given-names>A. K.</given-names>
</name>
<name>
<surname>Harke</surname> <given-names>M. J.</given-names>
</name>
<name>
<surname>Becker</surname> <given-names>K. W.</given-names>
</name>
<name>
<surname>Casey</surname> <given-names>J. R.</given-names>
</name>
<name>
<surname>Coesel</surname> <given-names>S. N.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>Complex Marine Microbial Communities Partition Metabolism of Scarce Resources Over the Diel Cycle</article-title>. <source>Nat. Ecol. Evol</source> <volume>6</volume>, <page-range>218&#x2013;29</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41559-021-01606-w</pub-id>
</citation>
</ref>
<ref id="B107">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Omori</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Ikeda</surname> <given-names>M.</given-names>
</name>
</person-group> (<year>1992</year>). <source>Methods in Marine Zooplankton Ecology</source> (<publisher-loc>Florida</publisher-loc>: <publisher-name>Krieger Plubishing Company</publisher-name>).</citation>
</ref>
<ref id="B108">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ortiz</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Gera</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Rivera</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Santos</surname> <given-names>J. C.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Pincho: A Modular Approach to High Quality <italic>De Novo</italic> Transcriptomics</article-title>. <source>Genes (Basel)</source> <volume>12</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/genes12070953</pub-id>
</citation>
</ref>
<ref id="B109">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ottesen</surname> <given-names>E. A.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Probing the Living Ocean With Ecogenomic Sensors</article-title>. <source>Curr. Opin. Microbiol</source> <volume>31</volume>, <page-range>132&#x2013;9</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.mib.2016.03.012</pub-id>
</citation>
</ref>
<ref id="B110">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Padilla</surname> <given-names>C. C.</given-names>
</name>
<name>
<surname>Ganesh</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Gantt</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Huhman</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Parris</surname> <given-names>D. J.</given-names>
</name>
<name>
<surname>Sarode</surname> <given-names>N.</given-names>
</name>
<etal/>
</person-group>. (<year>2015</year>). <article-title>Standard Filtration Practices may Significantly Distort Planktonic Microbial Diversity Estimates</article-title>. <source>Front. Microbiol.</source> <volume>6</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fmicb.2015.00547</pub-id>
</citation>
</ref>
<ref id="B111">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Passow</surname> <given-names>C. N.</given-names>
</name>
<name>
<surname>Kono</surname> <given-names>T. J. Y.</given-names>
</name>
<name>
<surname>Stahl</surname> <given-names>B. A.</given-names>
</name>
<name>
<surname>Jaggard</surname> <given-names>J. B.</given-names>
</name>
<name>
<surname>Keene</surname> <given-names>A. C.</given-names>
</name>
<name>
<surname>McGaugh</surname> <given-names>S. E.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Nonrandom RNAseq Gene Expression Associated With RNAlater and Flash Freezing Storage Methods</article-title>. <source>Mol. Ecol. Resour</source> <volume>19</volume>(<issue>2</issue>):<page-range>456&#x2013;64</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/1755-0998.12965</pub-id>
</citation>
</ref>
<ref id="B112">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Patro</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Duggal</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Love</surname> <given-names>M. I.</given-names>
</name>
<name>
<surname>Irizarry</surname> <given-names>R. A.</given-names>
</name>
<name>
<surname>Kingsford</surname> <given-names>C.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Salmon Provides Fast and Bias-Aware Quantification of Transcript Expression</article-title>. <source>Nat. Methods</source> <volume>14</volume>, <fpage>417</fpage>&#x2013;<lpage>419</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nmeth.4197</pub-id>
</citation>
</ref>
<ref id="B113">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pearson</surname> <given-names>G. A.</given-names>
</name>
<name>
<surname>Lago-Leston</surname> <given-names>A.</given-names>
</name>
<name>
<surname>C&#xe1;novas</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Cox</surname> <given-names>C. J.</given-names>
</name>
<name>
<surname>Verret</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Lasternas</surname> <given-names>S.</given-names>
</name>
<etal/>
</person-group>. (<year>2015</year>). <article-title>Metatranscriptomes Reveal Functional Variation in Diatom Communities From the Antarctic Peninsula</article-title>. <source>ISME J.</source> <volume>9</volume>, <fpage>2275</fpage>&#x2013;<lpage>2289</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/ismej.2015.40</pub-id>
</citation>
</ref>
<ref id="B114">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Peng</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Leung</surname> <given-names>H. C. M.</given-names>
</name>
<name>
<surname>Yiu</surname> <given-names>S.-M.</given-names>
</name>
<name>
<surname>Lv</surname> <given-names>M.-J.</given-names>
</name>
<name>
<surname>Zhu</surname> <given-names>X.-G.</given-names>
</name>
<name>
<surname>Chin</surname> <given-names>F. Y. L.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>IDBA-Tran: A More Robust <italic>De Novo</italic> De Bruijn Graph Assembler for Transcriptomes With Uneven Expression Levels</article-title>. <source>Bioinformatics</source> <volume>29</volume>, <fpage>i326</fpage>&#x2013;<lpage>i334</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/btt219</pub-id>
</citation>
</ref>
<ref id="B115">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pesant</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Not</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Picheral</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Kandels-Lewis</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Le Bescot</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Gorsky</surname> <given-names>G.</given-names>
</name>
<etal/>
</person-group>. (<year>2015</year>). <article-title>Open Science Resources for the Discovery and Analysis of Tara Oceans Data</article-title>. <source>Sci. Data</source> <volume>2</volume>, <fpage>150023</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/sdata.2015.23</pub-id>
</citation>
</ref>
<ref id="B116">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Prjibelski</surname> <given-names>A. D.</given-names>
</name>
<name>
<surname>Puglia</surname> <given-names>G. D.</given-names>
</name>
<name>
<surname>Antipov</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Bushmanova</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Giordano</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Mikheenko</surname> <given-names>A.</given-names>
</name>
<etal/>
</person-group>. (<year>2020</year>). <article-title>Extending Rnaspades Functionality for Hybrid Transcriptome Assembly</article-title>. <source>BMC Bioinf</source> <volume>21</volume>(<issue>302</issue>). doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12859-020-03614-2</pub-id>
</citation>
</ref>
<ref id="B117">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Rabines</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Lampe</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Allen</surname> <given-names>A. E.</given-names>
</name>
</person-group> (<year>2020</year>a). <source>Sterivex RNA Extraction</source>. doi:&#xa0;<pub-id pub-id-type="doi">10.17504/protocols.io.bd9ti96n</pub-id>
</citation>
</ref>
<ref id="B118">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Rabines</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Lampe</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Zeigler Allen</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Allen</surname> <given-names>A. E.</given-names>
</name>
</person-group> (<year>2020</year>b). <source>NOAA-CalCOFI Ocean Genomics (NCOG) Sample Collection</source>. doi:&#xa0;<pub-id pub-id-type="doi">10.17504/protocols.io.bmubk6sn</pub-id>
</citation>
</ref>
<ref id="B119">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ramette</surname> <given-names>A.</given-names>
</name>
</person-group> (<year>2007</year>). <article-title>Multivariate Analyses in Microbial Ecology</article-title>. <source>FEMS Microbiol. Ecol.</source> <volume>62</volume>, <fpage>142</fpage>&#x2013;<lpage>160</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/j.1574-6941.2007.00375.x</pub-id>
</citation>
</ref>
<ref id="B120">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rao</surname> <given-names>D.</given-names>
</name>
</person-group> (<year>2020</year>) <article-title>Characterizing Cobalamin Cycling by Antarctic Marine Microbes Across Multiple Scales</article-title> doi: <pub-id pub-id-type="doi">10.1575/1912/25832</pub-id>
</citation>
</ref>
<ref id="B121">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Reiner</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Yekutieli</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Benjamini</surname> <given-names>Y.</given-names>
</name>
</person-group> (<year>2003</year>). <article-title>Identifying Differentially Expressed Genes Using False Discovery Rate Controlling Procedures</article-title>. <source>Bioinformatics</source> <volume>19</volume>, <fpage>368</fpage>&#x2013;<lpage>375</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/btf877</pub-id>
</citation>
</ref>
<ref id="B122">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Richter</surname> <given-names>D. J.</given-names>
</name>
<name>
<surname>Berney</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Strassert</surname> <given-names>J. F.H.</given-names>
</name>
<name>
<surname>Burki</surname> <given-names>F.</given-names>
</name>
<name>
<surname>de Vargas</surname> <given-names>C.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>EukProt: A Database of Genome-Scale Predicted Proteins Across the Diversity of Eukaryotic Life</article-title>. <source>bioRxiv</source> doi: <pub-id pub-id-type="doi">10.1101/2020.06.30.180687</pub-id>.</citation>
</ref>
<ref id="B123">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Robertson</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Schein</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Chiu</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Corbett</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Field</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Jackman</surname> <given-names>S. D.</given-names>
</name>
<etal/>
</person-group>. (<year>2010</year>). <article-title>
<italic>De Novo</italic> Assembly and Analysis of RNA-Seq Data</article-title>. <source>Nat. Methods</source> <volume>7</volume>, <fpage>909</fpage>&#x2013;<lpage>912</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nmeth.1517</pub-id>
</citation>
</ref>
<ref id="B124">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Robinson</surname> <given-names>M. D.</given-names>
</name>
<name>
<surname>McCarthy</surname> <given-names>D. J.</given-names>
</name>
<name>
<surname>Smyth</surname> <given-names>G. K.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Edger: A Bioconductor Package for Differential Expression Analysis of Digital Gene Expression Data</article-title>. <source>Bioinformatics</source> <volume>26</volume>, <fpage>139</fpage>&#x2013;<lpage>140</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/btp616</pub-id>
</citation>
</ref>
<ref id="B125">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Robinson</surname> <given-names>M. D.</given-names>
</name>
<name>
<surname>Oshlack</surname> <given-names>A.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>A Scaling Normalization Method for Differential Expression Analysis of RNA-Seq Data</article-title>. <source>Genome Biol.</source> <volume>11</volume>, <fpage>R25</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/gb-2010-11-3-r25</pub-id>
</citation>
</ref>
<ref id="B126">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rusch</surname> <given-names>D. B.</given-names>
</name>
<name>
<surname>Halpern</surname> <given-names>A. L.</given-names>
</name>
<name>
<surname>Sutton</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Heidelberg</surname> <given-names>K. B.</given-names>
</name>
<name>
<surname>Williamson</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Yooseph</surname> <given-names>S.</given-names>
</name>
<etal/>
</person-group>. (<year>2007</year>). <article-title>The Sorcerer II Global Ocean Sampling Expedition: Northwest Atlantic Through Eastern Tropical Pacific</article-title>. <source>PloS Biol.</source> <volume>5</volume>, <fpage>1</fpage>&#x2013;<lpage>34</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1371/journal.pbio.0050077</pub-id>
</citation>
</ref>
<ref id="B127">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Saito</surname> <given-names>M. A.</given-names>
</name>
<name>
<surname>McIlvin</surname> <given-names>M. R.</given-names>
</name>
<name>
<surname>Moran</surname> <given-names>D. M.</given-names>
</name>
<name>
<surname>Goepfert</surname> <given-names>T. J.</given-names>
</name>
<name>
<surname>DiTullio</surname> <given-names>G. R.</given-names>
</name>
<name>
<surname>Post</surname> <given-names>A. F.</given-names>
</name>
<etal/>
</person-group>. (<year>2014</year>). <article-title>Multiple Nutrient Stresses at Intersecting Pacific Ocean Biomes Detected by Protein Biomarkers</article-title>. <source>Science</source> <volume>345</volume>(<issue>6201</issue>):<page-range>1173&#x2013;7</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1126/science.1256450</pub-id>
</citation>
</ref>
<ref id="B128">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Saito</surname> <given-names>M. A.</given-names>
</name>
<name>
<surname>McIlvin</surname> <given-names>M. R.</given-names>
</name>
<name>
<surname>Moran</surname> <given-names>D. M.</given-names>
</name>
<name>
<surname>Santoro</surname> <given-names>A. E.</given-names>
</name>
<name>
<surname>Dupont</surname> <given-names>C. L.</given-names>
</name>
<name>
<surname>Rafter</surname> <given-names>P. A.</given-names>
</name>
<etal/>
</person-group>. (<year>2020</year>). <article-title>Abundant Nitrite-Oxidizing Metalloenzymes in the Mesopelagic Zone of the Tropical Pacific Ocean</article-title>. <source>Nat. Geosci.</source> <volume>13</volume>, <fpage>355</fpage>&#x2013;<lpage>362</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41561-020-0565-6</pub-id>
</citation>
</ref>
<ref id="B129">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sandve</surname> <given-names>G. K.</given-names>
</name>
<name>
<surname>Nekrutenko</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Taylor</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Hovig</surname> <given-names>E.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Ten Simple Rules for Reproducible Computational Research</article-title>. <source>PloS Comput. Biol.</source> <volume>9</volume>, <fpage>1</fpage>&#x2013;<lpage>4</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1371/journal.pcbi.1003285</pub-id>
</citation>
</ref>
<ref id="B130">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Santoro</surname> <given-names>A. E.</given-names>
</name>
<name>
<surname>Saito</surname> <given-names>M. A.</given-names>
</name>
<name>
<surname>Goepfert</surname> <given-names>T. J.</given-names>
</name>
<name>
<surname>Lamborg</surname> <given-names>C. H.</given-names>
</name>
<name>
<surname>Dupont</surname> <given-names>C. L.</given-names>
</name>
<name>
<surname>DiTullio</surname> <given-names>G. R.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Thaumarchaeal Ecotype Distributions Across the Equatorial Pacific Ocean and Their Potential Roles in Nitrification and Sinking Flux Attenuation</article-title>. <source>Limnol. Oceanogr.</source> <volume>62</volume>, <fpage>1984</fpage>&#x2013;<lpage>2003</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/lno.10547</pub-id>
</citation>
</ref>
<ref id="B131">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Satinsky</surname> <given-names>B. M.</given-names>
</name>
<name>
<surname>Gifford</surname> <given-names>S. M.</given-names>
</name>
<name>
<surname>Crump</surname> <given-names>B. C.</given-names>
</name>
<name>
<surname>Moran</surname> <given-names>M. A.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Use of Internal Standards for Quantitative Metatranscriptome and Metagenome Analysis</article-title>. <source>Methods Enzymol.</source> <volume>531</volume>, <fpage>237</fpage>&#x2013;<lpage>250</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/B978-0-12-407863-5.00012-5</pub-id>
</citation>
</ref>
<ref id="B132">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Satinsky</surname> <given-names>B. M.</given-names>
</name>
<name>
<surname>Gifford</surname> <given-names>S. M.</given-names>
</name>
<name>
<surname>Crump</surname> <given-names>B. C.</given-names>
</name>
<name>
<surname>Smith</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Moran</surname> <given-names>M. A.</given-names>
</name>
</person-group> (<year>2017</year>). <source>Internal Genomic DNA Standard for Quantitative Metagenome Analysis V.3</source>. doi:&#xa0;<pub-id pub-id-type="doi">10.17504/protocols.io.jxdcpi6</pub-id>
</citation>
</ref>
<ref id="B133">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Schlitzer</surname> <given-names>R.</given-names>
</name>
</person-group> (<year>2018</year>). <source>Ocean Data View User&#x2019;s Guide</source>.</citation>
</ref>
<ref id="B134">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Schoenle</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Hohlfeld</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Hermanns</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Mah&#xe9;</surname> <given-names>F.</given-names>
</name>
<name>
<surname>de Vargas</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Nitsche</surname> <given-names>F.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>High and Specific Diversity of Protists in the Deep-Sea Basins Dominated by Diplonemids, Kinetoplastids, Ciliates and Foraminiferans</article-title>. <source>Commun. Biol.</source> <volume>4</volume>, <fpage>501</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s42003-021-02012-5</pub-id>
</citation>
</ref>
<ref id="B135">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Scholin</surname> <given-names>C. A.</given-names>
</name>
<name>
<surname>Birch</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Jensen</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Marin</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Massion</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Pargett</surname> <given-names>D.</given-names>
</name>
<etal/>
</person-group>. (<year>2017</year>). <article-title>The Quest to Develop Ecogenomic Sensors a 25-Year History of the Environmental Sample Processor (ESP) as a Case Study</article-title>. <source>Oceanography</source> <volume>30</volume>(<issue>4</issue>):<page-range>100&#x2013;13</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.5670/OCEANOG.2017.427</pub-id>
</citation>
</ref>
<ref id="B136">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Schroeder</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Mueller</surname> <given-names>O.</given-names>
</name>
<name>
<surname>Stocker</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Salowsky</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Leiber</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Gassmann</surname> <given-names>M.</given-names>
</name>
<etal/>
</person-group>. (<year>2006</year>). <article-title>The RIN: An RNA Integrity Number for Assigning Integrity Values to RNA Measurements</article-title>. <source>BMC Mol. Biol.</source> <volume>7</volume>, <elocation-id>3</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/1471-2199-7-3</pub-id>
</citation>
</ref>
<ref id="B137">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Semmouri</surname> <given-names>I.</given-names>
</name>
<name>
<surname>De Schamphelaere</surname> <given-names>K. A.C.</given-names>
</name>
<name>
<surname>Mees</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Janssen</surname> <given-names>C. R.</given-names>
</name>
<name>
<surname>and Asselman</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Evaluating the Potential of Direct RNA Nanopore Sequencing: Metatranscriptomics Highlights Possible Seasonal Differences in a Marine Pelagic Crustacean Zooplankton Community</article-title>. <source>Mar. Environ. Res</source>. doi: <pub-id pub-id-type="doi">10.1016/j.marenvres.2019.104836</pub-id>.</citation>
</ref>
<ref id="B138">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shakya</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Lo</surname> <given-names>C.-C.</given-names>
</name>
<name>
<surname>Chain</surname> <given-names>P. S. G.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Advances and Challenges in Metatranscriptomic Analysis</article-title>. <source>Front. Genet.</source> <volume>10</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fgene.2019.00904</pub-id>
</citation>
</ref>
<ref id="B139">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shannon</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Markiel</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Ozier</surname> <given-names>O.</given-names>
</name>
<name>
<surname>Baliga</surname> <given-names>N. S.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>J. T.</given-names>
</name>
<name>
<surname>Ramage</surname> <given-names>D.</given-names>
</name>
<etal/>
</person-group>. (<year>2003</year>). <article-title>Cytoscape: A Software Environment for Integrated Models of Biomolecular Interaction Networks</article-title>. <source>Genome Res.</source> <volume>13</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.1101/gr.1239303</pub-id>
</citation>
</ref>
<ref id="B140">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shi</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>McCarren</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Delong</surname> <given-names>E. F.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Transcriptional Responses of Surface Water Marine Microbial Assemblages to Deep-Sea Water Amendment</article-title>. <source>Environ. Microbiol</source> <volume>14</volume>(<issue>1</issue>):<fpage>191</fpage>&#x2013;<lpage>206</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/j.1462-2920.2011.02598.x</pub-id>
</citation>
</ref>
<ref id="B141">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Smith</surname> <given-names>D. R.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>RNA-Seq Data: A Goldmine for Organelle Research</article-title>. <source>Brief. Funct. Genomics</source> <volume>12</volume>, <fpage>454</fpage>&#x2013;<lpage>456</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bfgp/els066</pub-id>
</citation>
</ref>
<ref id="B142">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Soneson</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Love</surname> <given-names>M. I.</given-names>
</name>
<name>
<surname>Robinson</surname> <given-names>M. D.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Differential Analyses for RNA-Seq: Transcript-Level Estimates Improve Gene-Level Inferences</article-title>. <source>F1000Research</source> <volume>4</volume>, <fpage>1521</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.12688/f1000research.7563.2</pub-id>
</citation>
</ref>
<ref id="B143">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Song</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Milon</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Ott</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Zhao</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Sadzewicz</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Shetty</surname> <given-names>A.</given-names>
</name>
<etal/>
</person-group>. (<year>2018</year>). <article-title>A Comparative Analysis of Library Prep Approaches for Sequencing Low Input Translatome Samples</article-title>. <source>BMC Genomics</source> <volume>19</volume>, <fpage>696</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12864-018-5066-2</pub-id>
</citation>
</ref>
<ref id="B144">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sperfeld</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Yahalomi</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Segev</surname> <given-names>E.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Resolving the Microalgal Gene Landscape at the Strain Level: A Novel Hybrid Transcriptome of Emiliania Huxleyi CCMP3266</article-title>. <source>Appl. Environ. Microbiol.</source> <volume>88</volume>(<issue>2</issue>):<elocation-id>e0141821</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1128/AEM.01418-21</pub-id>
</citation>
</ref>
<ref id="B145">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Steinegger</surname> <given-names>M.</given-names>
</name>
<name>
<surname>S&#xf6;ding</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>MMseqs2 Enables Sensitive Protein Sequence Searching for the Analysis of Massive Data Sets</article-title>. <source>Nat. Biotechnol.</source> <volume>35</volume>, <fpage>1026</fpage>&#x2013;<lpage>1028</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nbt.3988</pub-id>
</citation>
</ref>
<ref id="B146">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Stewart</surname> <given-names>F. J.</given-names>
</name>
<name>
<surname>Ottesen</surname> <given-names>E. A.</given-names>
</name>
<name>
<surname>DeLong</surname> <given-names>E. F.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Development and Quantitative Analyses of a Universal rRNA-Subtraction Protocol for Microbial Metatranscriptomics</article-title>. <source>ISME J.</source> <volume>4</volume>, <fpage>896</fpage>&#x2013;<lpage>907</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/ismej.2010.18</pub-id>
</citation>
</ref>
<ref id="B147">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sun</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Shi</surname> <given-names>Q.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Combination Analysis of Metatranscriptome and Metagenome Reveal the Composition and Functional Response of Coral Symbionts to Bleaching During an El Ni&#xf1;o Event</article-title>. <source>Front. Microbiol.</source> <volume>11</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fmicb.2020.00448</pub-id>
</citation>
</ref>
<ref id="B148">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tamames</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Puente-S&#xe1;nchez</surname> <given-names>F.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>SqueezeMeta, a Highly Portable, Fully Automatic Metagenomic Analysis Pipeline</article-title>. <source>Front. Microbiol.</source> <volume>9</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fmicb.2018.03349</pub-id>
</citation>
</ref>
<ref id="B149">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tang</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Lomsadze</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Borodovsky</surname> <given-names>M.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Identification of Protein Coding Regions in RNA Transcripts</article-title>. <source>Nucleic Acids Res.</source> <volume>43</volume>(<issue>12</issue>), <elocation-id>e78</elocation-id>. doi: <pub-id pub-id-type="doi">10.1093/nar/gkv227</pub-id>
</citation>
</ref>
<ref id="B150">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tatusov</surname> <given-names>R. L.</given-names>
</name>
<name>
<surname>Fedorova</surname> <given-names>N. D.</given-names>
</name>
<name>
<surname>Jackson</surname> <given-names>J. D.</given-names>
</name>
<name>
<surname>Jacobs</surname> <given-names>A. R.</given-names>
</name>
<name>
<surname>Kiryutin</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Koonin</surname> <given-names>E. V.</given-names>
</name>
<etal/>
</person-group>. (<year>2003</year>). <article-title>The COG Database: An Updated Version Includes Eukaryotes</article-title>. <source>BMC Bioinf.</source> <volume>4</volume>, <elocation-id>41</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/1471-2105-4-41</pub-id>
</citation>
</ref>
<ref id="B151">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tully</surname> <given-names>B. J.</given-names>
</name>
<name>
<surname>Buongiorno</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Cohen</surname> <given-names>A. B.</given-names>
</name>
<name>
<surname>Cram</surname> <given-names>J. A.</given-names>
</name>
<name>
<surname>Garber</surname> <given-names>A. I.</given-names>
</name>
<name>
<surname>Hu</surname> <given-names>S. K.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>The Bioinformatics Virtual Coordination Network: An Open-Source and Interactive Learning Environment</article-title>. <source>Front. Educ.</source> <volume>6</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/feduc.2021.711618</pub-id>
</citation>
</ref>
<ref id="B152">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>van Damme</surname> <given-names>R.</given-names>
</name>
<name>
<surname>H&#xf6;lzer</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Viehweger</surname> <given-names>A.</given-names>
</name>
<name>
<surname>M&#xfc;ller</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Bongcam-Rudloff</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Brandt</surname> <given-names>C.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Metagenomics Workflow for Hybrid Assembly, Differential Coverage Binning, Metatranscriptomics and Pathway Analysis (MUFFIN)</article-title>. <source>PloS Comput. Biol.</source> <volume>17</volume>(<issue>2</issue>): <elocation-id>e1008716</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1371/JOURNAL.PCBI.1008716</pub-id>
</citation>
</ref>
<ref id="B153">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>van Dongen</surname> <given-names>S.</given-names>
</name>
</person-group> (<year>2000</year>). <article-title>Performance Criteria for Graph Clustering and Markov Cluster Experiments</article-title>. <source>Tech. Rep. INS-R0012, Natl. Res. Inst. Math. Comput. Sci</source>.</citation>
</ref>
<ref id="B154">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Van Vlierberghe</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Di Franco</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Philippe</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Baurain</surname> <given-names>D.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Decontamination, Pooling and Dereplication of the 678 Samples of the Marine Microbial Eukaryote Transcriptome Sequencing Project</article-title>. <source>BMC Res. Notes</source>. doi: <pub-id pub-id-type="doi">10.1186/s13104-021-05717-2</pub-id>.</citation>
</ref>
<ref id="B155">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Vanni</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Schechter</surname> <given-names>M. S.</given-names>
</name>
<name>
<surname>Acinas</surname> <given-names>S. G.</given-names>
</name>
<name>
<surname>Barber&#xe1;n</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Buttigieg</surname> <given-names>P. L.</given-names>
</name>
<name>
<surname>Casamayor</surname> <given-names>E. O.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Unifying the Known and Unknown Microbial Coding Sequence Space</article-title>. <person-group person-group-type="editor">
<name>
<surname>Brown</surname> <given-names>TC</given-names>
</name>
</person-group>
<source>ELife</source> <volume>11</volume>, <elocation-id>e67667</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.7554/eLife.67667</pub-id>
</citation>
</ref>
<ref id="B156">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Venter</surname> <given-names>J. C.</given-names>
</name>
<name>
<surname>Remington</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Heidelberg</surname> <given-names>J. F.</given-names>
</name>
<name>
<surname>Halpern</surname> <given-names>A. L.</given-names>
</name>
<name>
<surname>Rusch</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Eisen</surname> <given-names>J. A.</given-names>
</name>
<etal/>
</person-group>. (<year>2004</year>). <article-title>Environmental Genome Shotgun Sequencing of the Sargasso Sea</article-title>. <source>Science</source> <volume>304</volume> (<issue>5667</issue>), <fpage>66</fpage>&#x2013;<lpage>74</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1126/science.1093857</pub-id>
</citation>
</ref>
<ref id="B157">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Villar</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Vannier</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Vernette</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Lescot</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Cuenca</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Alexandre</surname> <given-names>A.</given-names>
</name>
<etal/>
</person-group>. (<year>2018</year>). <article-title>The Ocean Gene Atlas: Exploring the Biogeography of Plankton Genes Online</article-title>. <source>Nucleic Acids Res.</source> <volume>46</volume>, <fpage>W289</fpage>&#x2013;<lpage>W295</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/gky376</pub-id>
</citation>
</ref>
<ref id="B158">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wagner</surname> <given-names>G. P.</given-names>
</name>
<name>
<surname>Kin</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Lynch</surname> <given-names>V. J.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Measurement of mRNA Abundance Using RNA-Seq Data: RPKM Measure Is Inconsistent Among Samples</article-title>. <source>Theory Biosci.</source> <volume>131</volume>, <fpage>281</fpage>&#x2013;<lpage>285</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s12064-012-0162-3</pub-id>
</citation>
</ref>
<ref id="B159">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Walworth</surname> <given-names>N. G.</given-names>
</name>
<name>
<surname>Saito</surname> <given-names>M. A.</given-names>
</name>
<name>
<surname>Lee</surname> <given-names>M. D.</given-names>
</name>
<name>
<surname>McIlvin</surname> <given-names>M. R.</given-names>
</name>
<name>
<surname>Moran</surname> <given-names>D. M.</given-names>
</name>
<name>
<surname>Kellogg</surname> <given-names>R. M.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>Why Environmental Biomarkers Work: Transcriptome-Proteome Correlations and Modeling of Multi-Stressor Experiments in the Marine Bacterium Trichodesmium</article-title>. <source>J. Proteome Res</source>. <volume>21</volume> (<issue>1</issue>), <fpage>77</fpage>&#x2013;<lpage>89</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1021/acs.jproteome.1c00517</pub-id>
</citation>
</ref>
<ref id="B160">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Gribskov</surname> <given-names>M.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Comprehensive Evaluation of <italic>De Novo</italic> Transcriptome Assembly Programs and Their Effects on Differential Gene Expression Analysis</article-title>. <source>Bioinformatics</source> <volume>33</volume>, <fpage>327</fpage>&#x2013;<lpage>333</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/btw625</pub-id>
</citation>
</ref>
<ref id="B161">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Weissman</surname> <given-names>J. L.</given-names>
</name>
<name>
<surname>Dimbo</surname> <given-names>E.-R. O.</given-names>
</name>
<name>
<surname>Krinos</surname> <given-names>A. I.</given-names>
</name>
<name>
<surname>Neely</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Yag&#xfc;es</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Nolin</surname> <given-names>D.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Estimating the Maximal Growth Rates of Eukaryotic Microbes From Cultures and Metagenomes <italic>via</italic> Codon Usage Patterns</article-title>. <source>bioRxiv</source> doi:&#xa0;<pub-id pub-id-type="doi">10.1101/2021.10.15.464604</pub-id>
</citation>
</ref>
<ref id="B162">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wilms</surname> <given-names>S. N.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>A Beginner&#x2019;s Guide on Integrating *Omics Approaches to Study Marine Microbial Communities: Details and Discussions From Sample Collection to Bioinformatics Analysis</article-title>. <source>Front. Mar. Sci.</source> <volume>8</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fmars.2021.692538</pub-id>
</citation>
</ref>
<ref id="B163">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wilson</surname> <given-names>G.</given-names>
</name>
</person-group> (<year>2006</year>). <article-title>Software Carpentry: Getting Scientists to Write Better Code by Making Them More Productive</article-title>. <source>Comput. Sci. Eng.</source> <volume>8</volume>, <fpage>66</fpage>&#x2013;<lpage>69</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1109/MCSE.2006.122</pub-id>
</citation>
</ref>
<ref id="B164">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wu</surname> <given-names>M.</given-names>
</name>
<name>
<surname>McCain</surname> <given-names>J. S.P.</given-names>
</name>
<name>
<surname>Rowland</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Middag</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Sandgren</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Allen</surname> <given-names>A. E.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Manganese and Iron Deficiency in Southern Ocean Phaeocystis Antarctica Populations Revealed Through Taxon-Specific Protein Indicators</article-title>. <source>Nat. Commun</source>. doi: <pub-id pub-id-type="doi">10.1038/s41467-019-11426-z</pub-id>.</citation>
</ref>
<ref id="B165">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wu</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Gao</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Johnson</surname> <given-names>R. H.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Meldrum</surname> <given-names>D. R.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Integrated Metagenomic and Metatranscriptomic Analyses of Microbial Communities in the Meso- and Bathypelagic Realm of North Pacific Ocean</article-title>. <source>Mar. Drugs</source> <volume>11</volume> (<issue>10</issue>), 3777&#x2013;<lpage>801</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/md11103777</pub-id>
</citation>
</ref>
<ref id="B166">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Thompson</surname> <given-names>K. N.</given-names>
</name>
<name>
<surname>Branck</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Yan</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Nguyen</surname> <given-names>L. H.</given-names>
</name>
<name>
<surname>Franzosa</surname> <given-names>E. A.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Metatranscriptomics for the Human Microbiome and Microbial Community Functional Profiling</article-title>. <source>Annu. Rev. Biomed. Data Sci.</source> <volume>4</volume>, <fpage>279</fpage>&#x2013;<lpage>311</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1146/annurev-biodatasci-031121-103035</pub-id>
</citation>
</ref>
<ref id="B167">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhao</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Gamini</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>B.</given-names>
</name>
<name>
<surname>von Schack</surname> <given-names>D.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Evaluation of Two Main RNA-Seq Approaches for Gene Quantification in Clinical RNA Sequencing: Polya+ Selection Versus rRNA Depletion</article-title>. <source>Sci. Rep.</source> <volume>8</volume>, <fpage>4781</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41598-018-23226-4</pub-id>
</citation>
</ref>
<ref id="B168">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zwiener</surname> <given-names>I.</given-names>
</name>
<name>
<surname>Frisch</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Binder</surname> <given-names>H.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Transforming RNA-Seq Data to Improve the Performance of Prognostic Gene Signatures</article-title>. <source>PloS One</source> <volume>9</volume>, <elocation-id>e85150</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1371/journal.pone.0085150</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>