<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3-mathml3.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:ali="http://www.niso.org/schemas/ali/1.0/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="1.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Mar. Sci.</journal-id>
<journal-title-group>
<journal-title>Frontiers in Marine Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Mar. Sci.</abbrev-journal-title>
</journal-title-group>
<issn pub-type="epub">2296-7745</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fmars.2026.1769457</article-id>
<article-version article-version-type="Version of Record" vocab="NISO-RP-8-2008"/>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Original Research</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>Sampling microbial dynamics in the Salish Sea estuary: evaluating methods to capture cyanobacteria and cyanophage</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name><surname>Boise</surname><given-names>Noelani R.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/3236087/overview"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="visualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/visualization/">Visualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Leiser</surname><given-names>Owen P.</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/1761030/overview"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Jones</surname><given-names>Kristin</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Peter-Frank</surname><given-names>Mahala</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Leach</surname><given-names>Damon</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="visualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/visualization/">Visualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Crafton-Tempel</surname><given-names>Stephen</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="visualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/visualization/">Visualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Regier</surname><given-names>Peter</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/1232847/overview"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="visualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/visualization/">Visualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Wu</surname><given-names>Ruonan</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/1965869/overview"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Phillips</surname><given-names>Conner</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="visualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/visualization/">Visualization</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Cheung</surname><given-names>Margaret S.</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
<xref ref-type="aff" rid="aff6"><sup>6</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Project-administration" vocab-term-identifier="https://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Funding acquisition" vocab-term-identifier="https://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Johnson</surname><given-names>Connah G. M.</given-names></name>
<xref ref-type="aff" rid="aff7"><sup>7</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/3343222/overview"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="visualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/visualization/">Visualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Project-administration" vocab-term-identifier="https://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Edmundson</surname><given-names>Scott J.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>*</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/3170391/overview"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Pollock</surname><given-names>David D.</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="aff" rid="aff8"><sup>8</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>*</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/3343354/overview"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Project-administration" vocab-term-identifier="https://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Funding acquisition" vocab-term-identifier="https://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
</contrib>
</contrib-group>
<aff id="aff1"><label>1</label><institution>Coastal Sciences Division, Energy and Environment Directorate, Pacific Northwest National Laboratory</institution>, <city>Sequim</city>, <state>WA</state>, <country country="us">United States</country></aff>
<aff id="aff2"><label>2</label><institution>Nuclear, Chemical, and Biological Technologies Division, National Security Directorate, Pacific Northwest National Laboratory</institution>, <city>Seattle</city>, <state>WA</state>, <country country="us">United States</country></aff>
<aff id="aff3"><label>3</label><institution>Biological Sciences Division, Earth and Biological Sciences Directorate, Pacific Northwest National Laboratory</institution>, <city>Richland</city>, <state>WA</state>, <country country="us">United States</country></aff>
<aff id="aff4"><label>4</label><institution>AI and Data Analytics Division, National Security Directorate, Pacific Northwest National Laboratory</institution>, <city>Seattle</city>, <state>WA</state>, <country country="us">United States</country></aff>
<aff id="aff5"><label>5</label><institution>Environmental Molecular Sciences Laboratory, Pacific Northwest National Laboratory</institution>, <city>Richland</city>, <state>WA</state>, <country country="us">United States</country></aff>
<aff id="aff6"><label>6</label><institution>Physics Department, University of Washington</institution>, <city>Seattle</city>, <state>WA</state>, <country country="us">United States</country></aff>
<aff id="aff7"><label>7</label><institution>Advanced Computing, Mathematics, and Data Division, Physical and Computational Sciences Directorate, Pacific Northwest National Laboratory</institution>, <city>Richland</city>, <state>WA</state>, <country country="us">United States</country></aff>
<aff id="aff8"><label>8</label><institution>Department of Biochemistry and Molecular Genetics, University of Colorado School of Medicine</institution>, <city>Aurora</city>, <state>CO</state>, <country country="us">United States</country></aff>
<author-notes>
<corresp id="c001"><label>*</label>Correspondence: Scott J. Edmundson, <email xlink:href="mailto:Scott.Edmundson@pnnl.gov">Scott.Edmundson@pnnl.gov</email>; David D. Pollock, <email xlink:href="mailto:David.Pollock@CUAnschutz.edu">David.Pollock@CUAnschutz.edu</email></corresp>
</author-notes>
<pub-date publication-format="electronic" date-type="pub" iso-8601-date="2026-02-24">
<day>24</day>
<month>02</month>
<year>2026</year>
</pub-date>
<pub-date publication-format="electronic" date-type="collection">
<year>2026</year>
</pub-date>
<volume>13</volume>
<elocation-id>1769457</elocation-id>
<history>
<date date-type="received">
<day>17</day>
<month>12</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>30</day>
<month>01</month>
<year>2026</year>
</date>
<date date-type="rev-recd">
<day>26</day>
<month>01</month>
<year>2026</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2026 Boise, Leiser, Jones, Peter-Frank, Leach, Crafton-Tempel, Regier, Wu, Phillips, Cheung, Johnson, Edmundson and Pollock.</copyright-statement>
<copyright-year>2026</copyright-year>
<copyright-holder>Boise, Leiser, Jones, Peter-Frank, Leach, Crafton-Tempel, Regier, Wu, Phillips, Cheung, Johnson, Edmundson and Pollock</copyright-holder>
<license>
<ali:license_ref start_date="2026-02-24">https://creativecommons.org/licenses/by/4.0/</ali:license_ref>
<license-p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</license-p>
</license>
</permissions>
<abstract>
<sec>
<title>Introduction</title>
<p>Picocyanobacteria from the genera <italic>Prochlorococcus</italic> and <italic>Synechococcus</italic> thrive across the globe in aquatic environments, have relatively small genomes, and have growth dynamics regulated by both viral interactions and abiotic conditions, making them excellent model organisms for exploring host-pathogencoevolution.</p>
</sec>
<sec>
<title>Methods</title>
<p>We developed and refined methods to sample and sequence cyanobacteria, cyanophages, and measured features of their abiotic environment.</p>
</sec>
<sec>
<title>Results</title>
<p>The protocol described herein can successfully discriminate large-cell eukaryotic organisms, but size fractionation of picocyanobacteria appears to be affected by the presence of free DNA, multicellular structures, and abundant tycheposons. Our preferred final protocol from this exploratory effort included a combination of in-line and single vacuum flask filtrations, which reduced filtration processing time by over threefold in some cases compared to other tested methods, such as a fully in-line sequence or in-site filtrations. We successfully extracted an average of approximately 400&#x2013;1200 ng for all filter fractions, with some variations between kits.</p>
</sec>
<sec>
<title>Discussion</title>
<p>The protocol described herein can successfully discriminate large-cell eukaryotic organisms, but size fractionation of picocyanobacteria appears to be affected by the presence of free DNA, multicellular structures, and abundant tycheposons.</p>
</sec>
</abstract>
<kwd-group>
<kwd>phage host interactions</kwd>
<kwd>phytoplankton</kwd>
<kwd>picocyanobacteria</kwd>
<kwd>Salish Sea</kwd>
<kwd>metagenomics</kwd>
<kwd>viral ecology</kwd>
<kwd>sampling methods</kwd>
<kwd>sequence diversity</kwd>
</kwd-group>
<funding-group>
<award-group id="gs1">
<funding-source id="sp1">
<institution-wrap>
<institution>Office of Science</institution>
<institution-id institution-id-type="doi" vocab="open-funder-registry" vocab-identifier="10.13039/open_funder_registry">10.13039/100006132</institution-id>
</institution-wrap>
</funding-source>
</award-group>
<funding-statement>The author(s) declared that financial support was received for this work and/or its publication. The research described in this paper is supported by the NW-BRaVE for Biopreparedness project funded by the U. S. Department of Energy (DOE), Office of Science, Office of Biological and Environmental Research, under FWP 81832. A portion of this research was performed on a project award (Enhancing biopreparedness through a model system to understand the molecular mechanisms that lead to pathogenesis and disease transmission) from the Environmental Molecular Sciences Laboratory, a DOE Office of Science User Facility sponsored by the Biological and Environmental Research program. Pacific Northwest National Laboratory is a multi-program national laboratory operated by Battelle for the DOE under Contract DE-AC05-76RL01830. This research used resources of the Oak Ridge Leadership Computing Facility at the Oak Ridge National Laboratory, which is supported by the Advanced Scientific Computing Research programs in the DOE Office of Science under Contract No. DE-AC05-00OR22725.</funding-statement>
</funding-group>
<counts>
<fig-count count="11"/>
<table-count count="1"/>
<equation-count count="0"/>
<ref-count count="62"/>
<page-count count="18"/>
<word-count count="10619"/>
</counts>
<custom-meta-group>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Aquatic Microbiology</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<title>Introduction</title>
<p>The picocyanobacteria <italic>Prochlorococcus</italic> and <italic>Synechococcus</italic> are collectively a ubiquitous component of phytoplankton and play an outsized role in global primary production in both freshwater and marine systems (<xref ref-type="bibr" rid="B54">Visintini et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B7">Callieri et&#xa0;al., 2022</xref>). They have a large geographic distribution year-round  (<xref ref-type="bibr" rid="B14">Flombaum et&#xa0;al., 2013</xref>), but are more abundant in warm summer months (<xref ref-type="bibr" rid="B61">Zinser et&#xa0;al., 2006</xref>). The picocyanobacteria <italic>Prochlorococcus</italic> and <italic>Synechococcus</italic> are collectively a ubiquitous component of phytoplankton and play an outsized role in global primary production in both freshwater and marine systems (<xref ref-type="bibr" rid="B7">Callieri et&#xa0;al., 2022</xref>, <xref ref-type="bibr" rid="B54">Visintini et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B7">Callieri et&#xa0;al., 2022</xref>). They have a large geographic distribution year-round (<xref ref-type="bibr" rid="B14">Flombaum et&#xa0;al., 2013</xref>, <xref ref-type="bibr" rid="B14">Flombaum et&#xa0;al., 2013</xref>), but are more abundant in warm summer months (<xref ref-type="bibr" rid="B61">Zinser et&#xa0;al., 2006</xref>, <xref ref-type="bibr" rid="B61">Zinser et&#xa0;al., 2006</xref>). Typically ranging in size from 0.5&#x2013;0.8 and 0.8&#x2013;1.2 &#x3bc;m diameter, respectively, (<xref ref-type="bibr" rid="B38">Mella-Flores et al. 2012</xref>) the picocyanobacteria <italic>Prochlorococcus</italic> and <italic>Synechococcus</italic> are collectively a ubiquitous component of phytoplankton and play an outsized role in global primary production in both freshwater and marine systems (<xref ref-type="bibr" rid="B54">Visintini et al. 2021</xref>; <xref ref-type="bibr" rid="B7">Callieri et al. 2022</xref>), <italic>Prochlorococcus</italic> and <italic>Synechococcus</italic> are among the most abundant photosynthetic organisms on Earth and are key indicators of ecosystem health (<xref ref-type="bibr" rid="B49">S&#xe1;nchez-Gallego et&#xa0;al., 2025</xref>). Due to their prevalence in various marine and estuarine ecosystems, their relatively small genomes, and their anti-viral potential (e.g., cyanovirin-N, a potent antiviral lectin), these organisms are exceptional model organisms for studying viral-bacterial dynamics (<xref ref-type="bibr" rid="B54">Visintini et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B50">Scanlan et&#xa0;al., 2009</xref>; <xref ref-type="bibr" rid="B42">Reynolds et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B13">Edmundson et&#xa0;al., 2020</xref>). Well-adapted to oligotrophic conditions (<xref ref-type="bibr" rid="B28">Kent et&#xa0;al., 2019</xref>), they also thrive in the euphotic zone of tropical and subtropical waters and are expected to expand their distribution as ocean temperatures rise and impact oceanic communities (<xref ref-type="bibr" rid="B15">Flombaum et&#xa0;al., 2020</xref>; <xref ref-type="bibr" rid="B14">Flombaum et&#xa0;al., 2013</xref>). Given their ubiquity, these organisms are likely present in the coastal and estuarine waters of the northern Olympic Peninsula of Washington State, USA and surrounding Salish Sea waters, but few studies specifically focus on picocyanobacteria in this region (<xref ref-type="bibr" rid="B10">Del Bel Belluz et&#xa0;al., 2024</xref>). The Salish Sea lies along what was historically considered the northern boundary of the distribution of <italic>Prochlorococcus</italic> (defined by <italic>Prochlorococcus</italic> versus <italic>Synechococcus</italic> prevalence ratios), but this boundary is expected to have shifted and continue to change as ocean temperatures increase (<xref ref-type="bibr" rid="B43">Ribalet et&#xa0;al., 2025</xref>; <xref ref-type="bibr" rid="B14">Flombaum et&#xa0;al., 2013</xref>; <xref ref-type="bibr" rid="B39">Mioduchowska et&#xa0;al., 2023</xref>), making the changing interactions and relative success of <italic>Prochlorococcus</italic>, <italic>Synechococcus</italic>, and their viruses topics of considerable ecological and biopreparedness interest (<xref ref-type="bibr" rid="B13">Edmundson et&#xa0;al., 2020</xref>; <xref ref-type="bibr" rid="B42">Reynolds et&#xa0;al., 2021</xref>).</p>
<p>The Salish Sea is an expansive network of complex water bodies including the Strait of Juan de Fuca, the Strait of Georgia, and Puget Sound. Kathryn Sobocinski&#x2019;s <italic>The State of the Salish Sea</italic> report showcases the dynamic currents and biogeochemistry of these waters (<xref ref-type="bibr" rid="B53">Sobocinski, 2021</xref>). Strong upwelling of deep, nutrient-rich water due to outflow of freshwater from the Strait of Juan de Fuca produces dynamic seasonal fluctuations. This wind-driven upwelling of deep water can also decrease dissolved oxygen (DO) levels and increase nutrient-rich water from the coast which circulates through the strait. Wastewater from the heavily populated coastal areas around the Salish Sea also has significant effects on nutrient levels and thus cyanobacterial populations in these water bodies; in the summer, reduced freshwater outflow can lead to stagnant wastewater effluent and agricultural runoff in small regions of the Salish Sea, increasing seasonal eutrophication (<xref ref-type="bibr" rid="B53">Sobocinski, 2021</xref>). Despite extensive research on impacts of environmental conditions on picocyanobacteria, there is far less work documenting the impact of environmental factors on picocyanobacteria-cyanophage dynamics. Some work shows examples of environmental impacts, such as diel cycles impacting cyanobacterial gene expression and phage-host interactions (<xref ref-type="bibr" rid="B31">Liu et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B46">Rozum et&#xa0;al., 2025</xref>) and infection rates increasing in euphotic zones (<xref ref-type="bibr" rid="B16">Fuchsman and Hays, 2023</xref>).</p>
<p>While there are many commonly-used methods to sample specific microorganisms from aqueous environments (<xref ref-type="bibr" rid="B24">Huang et&#xa0;al., 2023</xref>), especially for public health end-uses (<xref ref-type="bibr" rid="B26">Karamati et&#xa0;al., 2024</xref>), there are few methods that provide relatively rapid samples targeting multiple size fractions from the same source water while simultaneously producing enough sample biomass for sufficient downstream genomic sequencing to elucidate community dynamics (<xref ref-type="bibr" rid="B26">Karamati et&#xa0;al., 2024</xref>; <xref ref-type="bibr" rid="B59">Zehr, 2010</xref>; <xref ref-type="bibr" rid="B23">Hshieh and Maloney, 2025</xref>). Methods such as flow cytometry (<xref ref-type="bibr" rid="B47">Ruber et&#xa0;al., 2018</xref>), eDNA sampling (<xref ref-type="bibr" rid="B48">Sahu et&#xa0;al., 2025</xref>), filter plating (<xref ref-type="bibr" rid="B27">Kearney et&#xa0;al., 2022</xref>), dilution-to-extinction (<xref ref-type="bibr" rid="B4">Buchholz et&#xa0;al., 2021</xref>), and density gradient centrifugation (<xref ref-type="bibr" rid="B45">Rong et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B29">Lawrence and Steward, 2010</xref>) can successfully identify or isolate target organisms, but require expensive equipment and refined expertise, have more limitations on target organisms than sequential filtration, and/or lack sequencing depth potential (<xref ref-type="bibr" rid="B1">Adams et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B52">Sharifian Gh. and Norouzi, 2023</xref>). Our described sampling method enables the isolation of multiple size fractions&#x2014;such as viruses and hosts&#x2014;from a discrete timeframe without culturing, as well as the simultaneous collection of metadata to inform the environmental context in which these organisms were found. By establishing consistent methods to obtain quality genomic and environmental data across locations, seasons, tidal stages, and diel cycles, this work yields holistic information to assess changing dynamics between marine cyanophages and picocyanobacteria, which can inform models that predict the behavior of higher-risk species. In a time of increasing risks in viral-host adaptations and spillover due to rapid environmental change (<xref ref-type="bibr" rid="B8">Carlson et&#xa0;al., 2022</xref>), it is critical that the scientific community establish consolidated methods for pairing environmental data with molecular research at a large scale to understand past, present, and future adaptation and interactive responses between viruses and their hosts. In addition to elucidating genomic relationships between phages and hosts, understanding the broader ecological and biogeochemical processes of discrete sample collections is essential for increasing predictive accuracy and capacity in model development (<xref ref-type="bibr" rid="B11">Dorigatti et&#xa0;al., 2025</xref>).</p>
<p>In this study, we tested and improved methods to sample and filter raw environmental water samples to extract DNA, identify picocyanobacteria and their associated phages, and describe their abiotic environment, with the long-term aim to study host-pathogen interactions and coevolution. To achieve this, we collected samples from five locations at varying times of day and tidal conditions along the northern Olympic Peninsula over an initial year-long period while performing iterative method development. Sampling involved collecting surface-level samples either via in-line <italic>in situ</italic> serial filtration or direct surface sampling. Due to the wide variety and size distribution of phytoplankton organisms and specifically cyanobacteria (<xref ref-type="bibr" rid="B37">Mehdizadeh Allaf and Peerhossaini, 2022</xref>), we performed serial filtrations to remove larger debris and to reduce the amount of larger-celled non-target organisms prior to sequencing. We focused on identifying relative read counts of target organisms in the genera <italic>Prochlorococcus and Synechococcus</italic>, along with previously identified cyanophage pathogens. Based on preliminary results showing that reads similar to eukaryotic amoeba were consistently observed in our samples, we used relative amoeba read counts as a marker for removal of large-celled organisms.</p>
<p>In summary, the present work describes the development and evaluation of methods for enriching and analyzing picocyanobacteria and associated cyanophages in the Salish Sea for metagenomic sequencing, along with preliminary observations of select lineages under various collection conditions over time. This work highlights the efficacy and replicability of sequential filtration and DNA extraction protocols to support studies of host-pathogen dynamics and environmental impacts on microbial interactions.</p>
</sec>
<sec id="s2" sec-type="materials|methods">
<title>Materials and methods</title>
<sec id="s2_1">
<title>Sampling, filtering and processing</title>
<p>We performed initial targeted sampling in Salish Sea waters from November 2023 to February 2025, mostly from the PNNL-Sequim floating dock and pier, and less frequently at four nearby locations: Cline Spit, south of John Wayne Marina near an estuary outflow, open waters North of Port Townsend, and in Discovery Bay (<xref ref-type="table" rid="T1"><bold>Table&#xa0;1</bold></xref>; <xref ref-type="fig" rid="f1"><bold>Figure&#xa0;1</bold></xref>). Sampling events, including filtering and collection (<xref ref-type="fig" rid="f2"><bold>Figures&#xa0;2</bold></xref>, <xref ref-type="fig" rid="f3"><bold>3</bold></xref>) occurred near-monthly at the PNNL-Sequim dock over the course of a year, with offsite sampling and multiple within-month sampling concentrated during peak summer months. A total of 30 primary sampling events were performed on 25 separate days at ebb, flood, and slack tides, with the majority occurring during flood tides. Water levels, temperature, salinity, and collection dates are shown in <xref ref-type="fig" rid="f4"><bold>Figure&#xa0;4</bold></xref>.</p>
<table-wrap id="T1" position="float">
<label>Table&#xa0;1</label>
<caption>
<p>Sample location descriptions for marked sites in <xref ref-type="fig" rid="f1"><bold>Figure&#xa0;1</bold></xref>.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="left">site reference number</th>
<th valign="middle" align="left">Sampling location</th>
<th valign="middle" align="left">Site coordinates</th>
<th valign="middle" align="left"># of sampling events</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="left">1</td>
<td valign="middle" align="left">Cline Spit Loading Dock</td>
<td valign="middle" align="left">48&#xb0;09&#x2019;06&#x201d;N 123&#xb0;09&#x2019;09&#x201d;W</td>
<td valign="middle" align="left">n = 1</td>
</tr>
<tr>
<td valign="middle" align="left">2</td>
<td valign="middle" align="left">PNNL-Sequim Floating Dock</td>
<td valign="middle" align="left">48&#xb0;04&#x2019;45&#x201d;N 123&#xb0;02&#x2019;42&#x201d;W</td>
<td valign="middle" align="left">n = 26</td>
</tr>
<tr>
<td valign="middle" align="left">3</td>
<td valign="middle" align="left">Exterior southern side of John Wayne Marina</td>
<td valign="middle" align="left">48&#xb0;03&#x2019;41&#x201d;N 123&#xb0;02&#x2019;20&#x201d;W</td>
<td valign="middle" align="left">n = 1</td>
</tr>
<tr>
<td valign="middle" align="left">4</td>
<td valign="middle" align="left">Southern end of Discovery Bay</td>
<td valign="middle" align="left">47&#xb0;59&#x2019;48&#x201d;N 122&#xb0;52&#x2019;32&#x201d;W</td>
<td valign="middle" align="left">n = 1</td>
</tr>
<tr>
<td valign="middle" align="left">5</td>
<td valign="middle" align="left">Open water north of Port Townsend</td>
<td valign="middle" align="left">48&#xb0;09&#x2019;56&#x201d;N 122&#xb0;48&#x2019;24&#x201d;W</td>
<td valign="middle" align="left">n = 1</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>All sites were sampled only once due to logistical challenges except for the PNNL-Sequim dock site, which was sampled 26 times in year one.</p></fn>
</table-wrap-foot>
</table-wrap>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>Sampling locations in the Salish Sea during the first year of sampling. 1) Cline Spit boat launch, 2) PNNL-Sequim floating dock, 3) Southern side of John Wayne Marina near estuary outflow, 4) Discovery Bay, 5) North of Port Townsend. All locations are located near the entrance of Admiralty Inlet from the Pacific Ocean. Satellite imagery generated using Google Earth. Inset (left) map data attribution: Google, Landsat/Copernicus Data SIO, NOAA, U.S. Navy, NGA, GEBCO Data LDEO-Columbia, NSF, NOAA Imagery from the dates: 12/14/2015&#x2013;1/1/2021. Regional map (right) map data attribution: Google, Airbus Data, SIO, NOAA, U.S. Navy, NGA, GEBCO Imagery from the dates: 9/27/2004&#x2013;10/14/2025.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-13-1769457-g001.tif">
<alt-text content-type="machine-generated">Satellite map showing the Salish Sea and nearby land in the Pacific Northwest, with an inset highlighting five marked locations: Cline Spit, PNNL Sequim Floating Dock, South Side of John Wayne Marina, Discovery Bay, and North of Port Townsend.</alt-text>
</graphic></fig>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>Serial filtration fractions. The projected target species enrichment goals for size fractionation are shown. The four fractions are: macro (&gt; 20 &#xb5;m); micro (5-20 &#xb5;m); pico (and small micro, 0.22-5 &#xb5;m); and viral (filtered through 0.22 &#xb5;m, then precipitated, then collected on 0.22 &#xb5;m filters). Note that the labels for these fractions are rough approximations, and the &#x201c;pico&#x201d; fraction in particular is generous at the upper end (5 &#xb5;m) to avoid filtering out organisms with irregularly grouped cells at the larger end of the picocyanobacterial range (<italic>Prochlorococcus</italic> 0.5-0.7 &#xb5;m, <italic>Synechococcus</italic> 0.8-1.5 &#xb5;m).</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-13-1769457-g002.tif">
<alt-text content-type="machine-generated">Diagram illustrating water filtration process through four filter fractions: macro (over 20 micrometers, e.g., diatoms, plankton), micro (5&#x2013;20 micrometers, mid-sized cyanobacteria), pico (0.22&#x2013;5 micrometers, picocyanobacteria), and viral (under 0.22 micrometers, cyanophages, free-floating environmental DNA), with examples of organisms or material captured at each stage.</alt-text>
</graphic></fig>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>Final sampling scheme. Scheme incorporates a combination of in-line filtrations and single-flask filtrations to increase time-efficiency, minimize material waste, and improve yield of pico and viral fractions. Filters were replicated either as subsequent replacement filters in the in-line or flask filtration process, or as cut fractions through the midpoint of the filter, obtained by physically cutting individual filters after sample collection.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-13-1769457-g003.tif">
<alt-text content-type="machine-generated">Flowchart illustrating an eight-step process for environmental sample filtration and DNA extraction, with labeled diagrams and images showing filter subsamples and corresponding DNA subsample tubes for macro, micro, pico, and viral fractions.</alt-text>
</graphic></fig>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>Seasonal data for water levels, temperature, and salinity. Values were measured using the MCRL Data sensor suite with denoted sampling events from 2024-2025.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-13-1769457-g004.tif">
<alt-text content-type="machine-generated">Three-panel scientific chart displays time series for water level, water temperature, and salinity from January 2024 to March 2025. Triangles highlight specific data points with associated numeric annotations. Water level fluctuates between approximately negative one and three meters, water temperature ranges from about eight to sixteen degrees Celsius, and salinity varies from approximately thirty to thirty-three PSU.</alt-text>
</graphic></fig>
<p>Samples were collected using two pilot methods, either 1) time-discrete samples using a horizontal water sampler, Niskin bottle, or direct surface sampling using a sterilized carboy; or 2) time-extended <italic>in situ</italic> in-line filtrations at the sampling site. The <italic>in-situ</italic> apparatus consisted of a custom-designed, weighted metal frame attached to flexible tubing that we tested using both peristaltic and vacuum pumps at approximately 550&#x2013;680 kPa and 130 kPa, respectively (<xref ref-type="supplementary-material" rid="SF1"><bold>Supplementary Table&#xa0;1</bold></xref>). We configured the tubing as an <italic>in-situ</italic> mechanism for two- and three-step serial filtrations using in-line filters that could be deployed from height and immediately pump raw seawater directly through two or three sequentially smaller filter sizes to capture target species, with the final filtrate collected into a sterile vessel. Alternatively, we used a direct water sampler (a Niskin bottle, horizontal water sampler, and/or a sterilized carboy) to collect discrete samples followed by filtrations in a laboratory. The in-line system collected samples over extended periods of time (up to 3 hours with especially dense water samples through a three-step filtration), compared to sampling durations of less than one minute using a direct water sampler.</p>
<p>Prior to sampling events, all sample collection vessels (carboys, Niskin bottles, and horizontal water samplers) were sterilized by autoclave or disinfected using a 10% bleach solution. We primed the collection vessel, tubing, and priming filters prior to every sample collection with water from the site, then discarded the priming water away from the collection point to avoid contamination. After collecting a pre-determined target volume, we immediately recorded metadata and sampling event context and assigned a single parent sampling ID to all associated data. Sampling conditions were noted, and additional weather data from the day of sampling were downloaded from the PNNL-Sequim Marine and Coastal Research Laboratory (MCRL) data site (<xref ref-type="bibr" rid="B34">MCRL Data, 2025</xref>).</p>
<p>Depending on which fractions were already processed, we then transported samples to our laboratory in Sequim WA to process the remaining filter fractions. All tubing and vessels were rinsed with 70% ethanol and/or autoclaved prior to priming with the appropriate matrix (we used each sequential filtrate to prime the subsequent collection vessels). For most samples, this involved a combination of in-line filtrations (20&#xb5;m 47 mm nylon filter and a 5 &#xb5;m 47 mm mixed-cellulose ester (MCE) membrane secured in either a Millipore 47 mm polypropylene nylon filter holder or a Cytiva 47mm polycarbonate in-line filter holder using a peristaltic pump, <xref ref-type="supplementary-material" rid="SF2"><bold>Supplementary Tables&#xa0;2</bold></xref>, <xref ref-type="supplementary-material" rid="SF3"><bold>3</bold></xref>) and single vacuum flask filtrations. In-line filtration was followed by mixing in a single-flask and filtration onto a sterile 0.22 &#xb5;m polyethersulfone (PES) or MCE filter in a vacuum flask to capture the pico fraction. Flow-throughs from the 0.22 &#xb5;m filter were precipitated using a method adapted from <xref ref-type="bibr" rid="B25">John et&#xa0;al. (2011)</xref>; iron chloride hexahydrate was added to the filtrate at 1 mL of 10g/L FeCl &#xb7; 6H<sub>2</sub>O solution in deionized water per 20 L of seawater and incubated for 1 hour, and precipitates were captured on a sterile 0.22 &#xb5;m PES filter via vacuum filtration.</p>
<p>Additional filtration setups we tested included a 0.05 &#xb5;m filter after 0.22 &#xb5;m filtration, and various alternate size combinations with the three filter types: nylon, MCE membranes, and PES. Specifically, we tested 47 mm and 90 mm 0.22 or 0.2 &#xb5;m MCE or PES filters, either as individual, sterile membranes or sterile vacuum units. We tested the 5 &#xb5;m and 0.22 &#xb5;m MCE membranes in an in-line filtration setup using either a polycarbonate filter-holder purchased from Avantor Sciences or a polypropylene filter-holder purchased from Millipore Sigma. The long-term use of 47 and 90 mm filters for differing filter fractions was driven by limited commercial availability of each material-pore size-diameter combination and for time-efficiency. A list of the tested filters, in-line filter holders, and other product information can be found in <xref ref-type="supplementary-material" rid="SF1"><bold>Supplementary Tables&#xa0;1</bold></xref>-<xref ref-type="supplementary-material" rid="SF4"><bold>4</bold></xref>.</p>
<p>In the final sampling scheme, the sampling process included separating environmental samples by serial filtration into four fractions (<xref ref-type="fig" rid="f2"><bold>Figure&#xa0;2</bold></xref>), labelled by their target organism size and the nominal pore sizes of the filters which they passed through and on which they were collected: macro (&gt; 20 &#xb5;m), micro (large micro, 5-20 &#xb5;m), pico (small micro, 0.22-5 &#xb5;m), and viral (&lt; 0.22 &#xb5;m).&#x200b; Further details are provided in <xref ref-type="fig" rid="f3"><bold>Figure&#xa0;3</bold></xref>. Note that filter subsamples for the 20 &#xb5;m and 5 &#xb5;m filters were obtained by changing filters as they became clogged (as estimated qualitatively by reduced flow rate), whereas most filter subsamples for the 0.22 &#xb5;m filters (both the pico and the viral fractions) were obtained by physically cutting&#xa0;the filters into thirds or quarters after completion of filtration (<xref ref-type="fig" rid="f3"><bold>Figure&#xa0;3</bold></xref>).</p>
</sec>
<sec id="s2_2">
<title>DNA extraction</title>
<p>DNA was extracted from selected filter subsamples using Zymo&#x2019;s Quick DNA Plant/Seed Miniprep Kit, and three Qiagen kits: DNeasy PowerWater Kit, PowerSoil Pro Kit, or Blood and Tissue Kit (<xref ref-type="supplementary-material" rid="SF4"><bold>Supplementary Table&#xa0;4</bold></xref>). Following extraction, DNA quality and quantity were assessed using a NanoDrop One spectrophotometer (ThermoFisher Scientific, Waltham, MA, USA) and Qubit4 fluorometer system (ThermoFisher Scientific, Waltham, MA, USA). Samples were then frozen, and a select few were later analyzed on an Agilent 4150 TapeStation for quality assessment (<xref ref-type="supplementary-material" rid="SF6"><bold>Supplementary Data Figure&#xa0;1</bold></xref>). Samples were opportunistically selected for comparative analyses and were chosen based on sample factors such as number of technical replicates, the filter size, date of sampling and extractions, and tidal stage. While we did not have sufficient sample numbers for controlled comparisons in many cases, we chose the most comparable samples from the larger exploratory set and excluded samples that were too variable.</p>
<p>For direct comparisons of the kit effect on DNA recovery, DNA from select sampling events were extracted using two separate kits (Blood &amp; Tissue and PowerWater) and analyzed on an Agilent 4150 TapeStation using a D5000 ScreenTape and the relevant kit reagents (D5000 buffer and D5000 ladder) following the kit protocol with no modifications (Agilent Technologies, Palo Alto, CA, USA). To understand whether levels of variability due to kits are large compared to other sources of variation, we also make comparisons of DNA recovery without controlling for other known variables, which we refer to as &#x2018;kitchen sink&#x2019; comparisons (a mix of conditions and replicates) to clarify the context in which they should be interpreted.</p>
</sec>
<sec id="s2_3">
<title>Metadata collection and processing</title>
<p>PNNL-Sequim is uniquely positioned for marine environmental research, leveraging its bench-to-bay capabilities through direct access to Sequim Bay, raw seawater access in the facilities, and a unique array of permanently deployed environmental sensors (<xref ref-type="bibr" rid="B34">MCRL Data, 2025</xref>). Most sampling events took place from the PNNL-Sequim floating dock at the mouth of Sequim Bay with an extensive range of environmental parameters documented from the MCRL Data, while other locations relied solely on parameters captured from a YSI ProDSS multiparameter water quality meter (YSI Xylem, Yellow Springs OH) (<xref ref-type="supplementary-material" rid="SF5"><bold>Supplementary Data Table&#xa0;5</bold></xref>). For PNNL-Sequim sampling events, we acquired data post-sampling using targeted scripts (<xref ref-type="bibr" rid="B35">MCRLdata Sandbox, 2025a</xref>; <xref ref-type="bibr" rid="B36">MCRLdata Sandbox, 2025b</xref>) to process environmental data from an online data repository (<xref ref-type="bibr" rid="B34">MCRL Data, 2025</xref>). One sampling event used for a controlled membrane test was executed in PNNL&#x2019;s marine mesocosm system, which circulates unfiltered seawater through a large (ca. 62,000 L) outdoor tank (<xref ref-type="bibr" rid="B33">Marine and Coastal Research Laboratory, 2025</xref>). This mesocosm system was used for a single sampling event due to restricted access to the PNNL-Sequim floating dock during the scheduled sampling time. While the samples from the mesocosm and dock are not directly comparable, the mesocosm system is constantly circulated with raw seawater with a submerged intake a few meters away the floating dock.</p>
<p>We used data collected for tidal stage, water temperature, and salinity by the sensors described above to provide environmental context for sampling events off the PNNL-Sequim dock (<xref ref-type="fig" rid="f4"><bold>Figure&#xa0;4</bold></xref>). Data collected by sensors are sent to the cloud where they undergo automated initial quality control and displayed in near real-time (<xref ref-type="bibr" rid="B34">MCRL Data, 2025</xref>) and are provided as part of the joint metadata summary (<xref ref-type="bibr" rid="B35">MCRLdata Sandbox, 2025a</xref>; <xref ref-type="bibr" rid="B36">MCRLdata Sandbox, 2025b</xref>). Additional quality control combining automated (e.g. de-spiking) and manual visual assessment were then applied, resulting in several data gaps originating from sensor maintenance, sensor errors, or unreliable data (identified during quality control). To fill any gaps, we used the <italic>ranger</italic> R package to construct Random Forest models (<xref ref-type="bibr" rid="B58">Wright and Ziegler, 2017</xref>). First, we gap-filled water levels by building a Random Forest model using water levels (<xref ref-type="bibr" rid="B41">NOAA Tides and Currents, 2025</xref>) pulled using the <italic>VulnToolkit</italic> R package along with hour of day, and day of year as predictors (<xref ref-type="bibr" rid="B22">Hill et&#xa0;al., 2021</xref>). The resulting model (R<sup>2</sup> = 0.96) was then used to gap-fill water levels. Those gap-filled water levels were used (along with hour of day and day of year) to predict both water temperature and salinity measured off the MCRL dock by CTD (conductivity, temperature, and depth sensor), and those models were used to gap-fill both temperature and salinity time-series. Model goodness-of-fit was high for both temperature and salinity models (R<sup>2</sup> = 0.93 and 0.95, respectively).</p>
</sec>
<sec id="s2_4">
<title>Sequencing and preliminary data processing</title>
<p>DNA subsamples were shipped on ice to Azenta Life Sciences (South Planfield, NJ,USA) for sequencing. Sequencing libraries were prepared using NEBNext Ultra DNA Library Prep Kit (New England Biolabs, Ipswich, MA, USA) according to manufacturer&#x2019;s instructions. Briefly, genomic DNA was acoustically fragmented using a Covaris S220 instrument (Covaris, Woburn, MA, USA) and fragmented DNA was cleaned and end repaired. Sequencing adapters were ligated to 3&#x2019; ends of fragments after adenylation and enriched by limited-cycle PCR. Sequence libraries were validated using a High Sensitivity D1000 ScreenTape on an Agilent TapeStation (Agilent Technologies, Palo Alto, CA, USA) and quantified using a Qubit 3.0 fluorometer (ThermoFisher Scientific, Waltham, MA, USA). Sequence libraries were also quantified using real-time PCR (Applied Biosystems, Carlsbad, CA, USA) libraries from samples that passed all quality control steps and were multiplexed and clustered onto an Illumina NovaSeq flowcell (Illumina, San Diego, CA, USA) and sequenced using 2x150 paired-end configuration. Base calling and image analysis were conducted using the NovaSeqControl Software. Raw sequence data was converted to fastq format and de-multiplexed using Illumina&#x2019;s bcl2fastq software v2.20, allowing one mismatch for index sequence identification. Sequencing datasets were processed through the sequence processing pipelines described below for evaluation of the efficacy of filter fractionation methods and to refine strategies for further sampling. Raw paired-end reads were sequentially pre-processed by first interleaving paired reads into a single sequence read file preserving read pair information using the reformat functionality of BBTools v37.62 (<xref ref-type="bibr" rid="B6">Bushnell et&#xa0;al., 2017</xref>). Interleaved reads were clustered, with optical and PCR duplicate reads removed using clumpify within BBTools. Reads derived from low-quality regions of flowcells were removed using the filterbytile functionality from BBTools. BBTools bbduk was used to sequentially remove Illumina sequencing adapters, bases from the ends of reads below a phred33 quality score of ten, any reads with an overall phred33 quality score lower than ten, and any reads mapping to PhiX spike-in. Read quality was assessed before and&#xa0;after preprocessing using FastQC v0.12.1 (<xref ref-type="bibr" rid="B3">Babraham Institute, 2023</xref>).</p>
<p>We generated metagenome contig assemblies using MEGAHIT v1.2.9 (<xref ref-type="bibr" rid="B30">Li et&#xa0;al., 2015</xref>) under default settings in paired-end mode. Output contigs were filtered by length as required for downstream analyses using the reformat functionality of BBTools. Assembly qualities were assessed using QUAST v5.3.0 (<xref ref-type="bibr" rid="B19">Gurevich et&#xa0;al., 2013</xref>). Putative coding regions and putative protein sequences were predicted within metagenome assemblies filtered to contigs larger than 2500 bases using Metaprokka v1.15.0 (<xref ref-type="bibr" rid="B51">Seemann, 2014</xref>).</p>
<p>Raw short read pairs, interleaved pre-processed reads, contig assemblies, and predicted genes and proteins are found in <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Data 3</bold></xref> and were deposited to BioProject PRJNA1336290.</p>
</sec>
<sec id="s2_5">
<title>FAIR data management</title>
<p>We assigned each sampling event a unique parent ID that was tagged to the relevant environmental data for every filter and DNA subsample, which also had its own unique subsample ID. To track sampling events, we created a standardized field form with nomenclature and categorization based on the National Microbiome Data Collaborative (NMDC) water sample template for data documentation compatibility with the other public repositories (<xref ref-type="bibr" rid="B40">National Microbiome Data Collaborative, 2026</xref>). The unique sample identifiers for all parent and subsamples were used to further facilitate consistent data integration. Sequences, processed sequences, analytical results and associated metadata were captured and a) stored for sharing among the team using DataFed federated data storage and Globus-enabled federated IDs to ensure that this data is searchable and well-structured (<xref ref-type="bibr" rid="B18">George et&#xa0;al., 2025</xref>; <xref ref-type="bibr" rid="B12">EcoKMER GitHub Software Repository, 2025</xref>) and b) harmonized and visualized using the concurrently-developed EcoKMER program (<xref ref-type="bibr" rid="B18">George et&#xa0;al., 2025</xref>) with final output stored as a CSV file (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Data 1</bold></xref>). This integrated metadata file combined sequencing summary information with environmental and contextual data, adhering to FAIR (Findable, Accessible, Interoperable, and Reusable) principles (<xref ref-type="bibr" rid="B57">Wilkinson et&#xa0;al., 2016</xref>) and ensures that this data is searchable and well-structured.</p>
</sec>
<sec id="s2_6">
<title>Microbial sequence diversity estimation</title>
<p>To assess sequence diversity across environmental metagenomes, we applied Nonpareil (v3.5.5) to interleaved pre-processed reads (<xref ref-type="bibr" rid="B44">Rodriguez-R et&#xa0;al., 2018</xref>). Because the default kmer size for Nonpareil is 24, reads shorter than 24 base pairs (bp) were excluded. Nonpareil estimates average community coverage and diversity using kmer redundancy, modeling the rate at which new 24 bp sequences are encountered with increasing sequencing effort. The resulting Nonpareil diversity index (Nd) used does not cleanly reflect microbial diversity, as it reports diversity inferred from identical 24mers sampled, and does not account for variable rates along genomes, or variable genome size, but it has nevertheless been demonstrated to be useful in detecting differences in community composition (<xref ref-type="bibr" rid="B44">Rodriguez-R et&#xa0;al., 2018</xref>).</p>
</sec>
<sec id="s2_7">
<title>Relative read coverage of target taxa</title>
<p>61 DNA subsamples produced in year one were sequenced, filtered, assembled into contigs, and 24mer sequence diversities were calculated. To quantify taxon-specific enrichment of organisms with varying sizes, we mapped metagenomic reads to curated reference genome sets using BBMap (v39.13) (<xref ref-type="bibr" rid="B5">Bushnell, 2014</xref>). Five reference genome sets were constructed from high-quality, complete NCBI genomes representing <italic>Prochlorococcus</italic> (26 reference genomes), <italic>Synechococcus</italic> (78 reference genomes), their phages (341 <italic>Synechococcus</italic> phage genomes; 37 <italic>Prochlorococcus</italic> phage genomes), and <italic>Acanthamoeba</italic> spp (5 reference genomes; accession numbers of each reference set in <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Data 2</bold></xref>). Our main reason to focus on these taxon groups was to identify the relative occurrence of the two picocyanobacterium and cyanophages that might be associated with them. In addition, we separately mapped reads to a mycetezoan amoeba to determine the effectiveness of filtering out large-celled organisms. Each set was indexed using the BBMap indexing utility. Quality-filtered reads from each sample were aligned to each reference genome set using default parameters, and coverage statistics were calculated with the BBMap pileup utility (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Data 1</bold></xref>), which attaches each read to the reference genome in a run that matches it best, and leaves unattributed any reads that do not pass the minimum matching cutoff to any included genome(s). We repeated this analysis using the curated CyanoRak database of <italic>Prochlorococcus</italic> and <italic>Synechococcus</italic> reference samples (<xref ref-type="supplementary-material" rid="SF8"><bold>Supplementary Figure&#xa0;3</bold></xref>), with highly correlated results between our analysis and that using CyanoRak (<xref ref-type="bibr" rid="B17">Garczarek et&#xa0;al., 2021</xref>).</p>
<p>Each of the six genome groups listed above were analyzed separately. During preliminary analysis, we observed that the bulk of <italic>Acanthamoeba</italic> reads were consistently attributed to the five major chromosomes of <italic>Dictyostelium discoideum</italic>, so we opted to present the sum of plus and minus reads (relative to genome orientation) most preferentially attributed to these five chromosomes as a marker for large-celled amoeboid organisms. <italic>Dictyostelium discoideum</italic> is nominally a soil organism, but the representation of diverse amoeboid organisms in the genome references was not strong, and these results should not be construed to positively indicate an undue degree of soil contamination in estuarine waters or to identify the actual genus or species source in these aquatic samples&#x2014;relative amoeba read counts were only used as a marker for removal of large-celled organisms. For other runs, we report the sum of the plus and minus reads for all genomes in the reference set. To normalize differences in sequencing depth, total read counts per sample were used to compute reads per million (RPM). For comparison, we ran Kraken/Bracken (<xref ref-type="bibr" rid="B32">Lu et&#xa0;al., 2022</xref>) using version 2.0.7-beta of the Kraken database using default parameters, outputting the total reads that were attributable to the groups <italic>Prochlorococcus</italic>, <italic>Synechococcus</italic>, and <italic>Dictyoselium discoideum</italic>. The output is reported in <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Data 1</bold></xref>. Read counts using Bracken are generally lower than for BBMap, likely due to use of a smaller reference database and differences in default parameters.</p>
</sec>
</sec>
<sec id="s3" sec-type="results">
<title>Results</title>
<sec id="s3_1">
<title>Sample collection and processing</title>
<p>Available pumps (see Methods and <xref ref-type="supplementary-material" rid="SF1"><bold>Supplementary Table&#xa0;1</bold></xref>), including eDNA and peristaltic models, did not reliably generate enough power to overcome sampling challenges at height from piers or vessels, so direct surface sampling was preferred over <italic>in-situ</italic> filtration. Biomass accumulation quickly clogged the 0.22 &#xb5;m inline filter, which inhibited consistent flow and led to eventual removal of 0.22 &#xb5;m inline filters from our protocol in favor of flask filtration of the mixed 5 &#xb5;m filtrate in the tertiary filtration step (<xref ref-type="fig" rid="f2"><bold>Figures&#xa0;2</bold></xref>, <xref ref-type="fig" rid="f3"><bold>3</bold></xref>).</p>
<p>Millipore&#x2019;s 47 mm polypropylene nylon in-line filter holders improved flow rates over Cytiva&#x2019;s 47 mm polycarbonate filter holders, reducing macro and micro filtration time by over 50% and reducing sample loss due to inhibitive filtration times and insufficient gasket seals in alternative holders. The 30 primary sampling events were ultimately segregated by filtration and technical replicates into 294 filter subsamples and 424 DNA subsamples, with filters cut and used for replicate DNA extractions. With the final protocol detailed in <xref ref-type="fig" rid="f3"><bold>Figure&#xa0;3</bold></xref>, we were able to produce all four filter fractions in as little as three hours for water with relatively low biomass, though this could be greatly reduced if processing smaller volumes. Filtrations could extend up to 10 hours in some cases when the collection volume was high (up to 60 liters) and/or the sampled substrate contained higher levels of biomass, such as during an algal bloom. Compared to similar methods used for the isolation of picocyanobacteria and cyanophages, such as flow cytometry, eDNA, density-gradient centrifugations, culturing, dilution to extinction, and titer plating, this protocol can be completed the same day as sampling with relatively inexpensive equipment, moderate processing volumes, and can be easily adapted for varying target organisms based on size. Additionally, this protocol can be used with sufficient preparation <italic>in-situ</italic> as well as in a laboratory setting for filtration processing, and produced multiple filter fraction samples that reduce sequencing noise in downstream applications. The 30 primary sampling events were ultimately segregated by filtration and technical replicates into 294 filter subsamples and 424 DNA subsamples, with filters cut and used for replicate DNA extractions.</p>
</sec>
<sec id="s3_2">
<title>Environmental metadata</title>
<p>As expected, we found that water temperatures increased at the entrance of Sequim Bay through summer months, peaking from late July to early August 2024, with lows in February 2025 (<xref ref-type="fig" rid="f4"><bold>Figure&#xa0;4</bold></xref>). The lowest recorded water temperature of the 26 sampling events from PNNL Sequim was 7.7 &#xb0;C on 2 January, 2024, and the highest recorded temperature was 14.7 &#xb0;C on 17 July, 2024. The sampling event at Cline Spit had the highest recorded temperature of 19.8 &#xb0;C on 7 August, 2024. The highest practical salinity value derived from the MCRL dock data was 32.1 on 18 August, 2024 and the lowest was 30.3 on 7 April, 2025. Surface sampling events occurred across a range of tidal events, ranging from -0.2 to 2.2 meters in water depth. Of all 30 sampling events, two were sampled during a slack low tide, three during a slack high tide, 17 during a flood tide, seven during an ebb tide, and one event from the Sequim outdoor mesocosm tank did not have an assigned tidal stage.</p>
</sec>
<sec id="s3_3">
<title>DNA yields under various conditions</title>
<p>DNA yields for various method and environmental context comparisons were statistically analyzed by using a Tukey&#x2019;s <italic>post hoc</italic> test (p &lt; 0.05) after performing an analysis of variance (ANOVA). Due to the highly limited sample sizes in some comparisons (as little as two in each group), these results can only be considered preliminary. Conclusions should be validated with further studies and greater sample sizes. The results for low sample size comparisons must be interpreted with caution, acknowledging that the impact of outliers or deviations may be amplified, and group variance and differences may not be accurately depicted.</p>
<p>In an exploratory controlled comparison of DNA yields, the Blood &amp; Tissue kit outperformed the PowerWater and PowerSoil kits, yielding approximately 3900, 690, and 2100 ng DNA, respectively (<xref ref-type="fig" rid="f5"><bold>Figure&#xa0;5</bold></xref>). For this controlled comparison, two pico filters (90mm PES) from a single sampling event were cut into thirds, and DNA was extracted from each third using a different kit (n = two extractions per kit). Samples labeled &#x201c;ab&#x201d; in <xref ref-type="fig" rid="f5"><bold>Figure&#xa0;5</bold></xref> denote an overlap between groups a and b, indicating that DNA yields in these samples are not significantly different from either group a or group b, while groups a and b are significantly different from each other, as determined by a Tukey&#x2019;s <italic>post hoc</italic> test (p &lt; 0.05) after performing an analysis of variance (ANOVA). However, a &#x2018;kitchen sink&#x2019; comparison (a mix of conditions and replicates, controlling only for filter pore size and location) of each filter fraction across all DNA subsamples collected at PNNL-Sequim (macro, micro, pico, and viral) that also included the Zymo Plant/Seed kit (<xref ref-type="fig" rid="f6"><bold>Figure&#xa0;6</bold></xref>) resulted in highly variable yields under each condition such that there were no significant differences in the micro, pico, and viral fractions, and overlapping significance groups in the macro fraction. Yields in the three direct filter fractions (macro, micro, and pico) were on average relatively high (~500&#x2013;1000 ng or more), with a large proportion having acceptable yields for downstream sequencing (50 ng or greater; <xref ref-type="fig" rid="f6"><bold>Figure&#xa0;6</bold></xref>). This supports our approach of running filters to saturation to obtain sufficient material for DNA extraction. Perhaps unsurprisingly, the viral fractions had generally lower DNA yields, averaging 450 ng compared to an average of 1210, 1272, and 924 ng for the pico, micro, and macro fractions, respectively. However, viral DNA yields were often still high enough for sequencing.</p>
<fig id="f5" position="float">
<label>Figure&#xa0;5</label>
<caption>
<p>Comparative DNA yields from different extraction kits: Blood &amp; Tissue Kit (BTK, purple), PowerSoil Kit (PSK, blue), and PowerWater Kit (PWK, green). DNA recovered (measured using a Qubit fluorometer) is shown for pico fractions (small micro) of a single sampling event on 26 August, 2024 during a high slack tide. Letters indicate significance groups as denoted by a Tukey&#x2019;s <italic>post hoc</italic> test (p &lt; 0.05) after performing an analysis of variance (ANOVA), while n=2 indicates sample size in each plot.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-13-1769457-g005.tif">
<alt-text content-type="machine-generated">Boxplot comparing Qubit yield of DNA in nanograms for three kit types: BTK, PSK, and PWK. BTK shows the highest yield, PSK the lowest, and PWK an intermediate yield. Labels indicate significant differences using letters a, ab, and b, with sample size n equals two for each group. Colors differentiate kit types: purple for BTK, blue for PSK, and green for PWK.</alt-text>
</graphic></fig>
<fig id="f6" position="float">
<label>Figure&#xa0;6</label>
<caption>
<p>Kitchen sink comparison of DNA yields from different extraction kits for all filter fractions. DNA recovered (measured using a Qubit fluorometer) using the Blood &amp; Tissue Kit (BTK, purple), PowerSoil Kit (PSK, blue), PowerWater Kit (PWK, green), or Zymo Plant/Seed (ZPK, yellow) across all PNNL-Sequim sampling events. Filter fractions included in this figure are: macro (top left), micro (top right), pico (bottom left) and viral (bottom right) fractions. All conditions are labelled &#x201c;a&#x201d; indicating that there was only one significance group as denoted by a Tukey&#x2019;s <italic>post hoc</italic> test (p &lt; 0.05) after performing an ANOVA to determine the extraction kit had a significant impact on yield, and n indicates sample size in each plot. These results include all samples from all PNNL-Sequim sampling events, filter types, and dates over the year. Variable conditions are not taken into account in each test other than extraction method.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-13-1769457-g006.tif">
<alt-text content-type="machine-generated">Four boxplot panels compare qubit yield of DNA in nanograms from different filter fractions (Macro, Micro, Pico, Viral) across kit types: BTK, PSK, PWK, and ZPK, with sample sizes labeled and PSK showing higher yield variability in most panels.</alt-text>
</graphic></fig>
<p>A similar kitchen sink comparison (controlling only for filter pore size and location) of MCE versus PES membranes also had high variation in yield. While the MCE membranes yielded slightly more DNA than the PES membranes for the pico fraction (1260 ng average for pico MCE and 1143 ng average for pico PES), the difference was insubstantial compared to the variation among samples (<xref ref-type="fig" rid="f7"><bold>Figure&#xa0;7a</bold></xref>). In a more controlled, exploratory comparison of DNA yields from samples, the MCE membranes in the pico fraction were significantly greater than the PES membranes (p &lt; 0.05, 1818 and 1673 ng DNA, respectively), but the differences were small relative to the DNA yield (<xref ref-type="fig" rid="f7"><bold>Figure&#xa0;7b</bold></xref>). Differences between PES and MCE in the viral fraction were also relatively small (324 ng difference in broad comparison, and 54 ng difference in focused comparison) and either were not significantly different or had overlapping significance groups based on a Tukey&#x2019;s <italic>post hoc</italic> test (p &lt; 0.05) after performing an ANOVA. Losses of yield when extracting DNA from filters after a long freezer storage period (over 100 days) were small and not significant (<xref ref-type="fig" rid="f8"><bold>Figure&#xa0;8</bold></xref>).</p>
<fig id="f7" position="float">
<label>Figure&#xa0;7</label>
<caption>
<p>DNA yields for different filter types. DNA recovered for pico (green) and viral (blue) filter fractions obtained using PES filters (left in each subfigure), and MCE membrane filters (right in each subfigure). <bold>(A)</bold> Kitchen sink comparison of all filters collected from PNNL-Sequim or <bold>(B)</bold> focused comparison of filters collected from a seawater mesocosm tank on 3 December, 2024. Lowercase letters inside graph area indicate significance groups as denoted by a Tukey&#x2019;s post hoc test (p &gt; 0.05) after performing an ANOVA to determine if material and fraction had a significant impact on yield. Samples labeled &#x201c;ab&#x201d; denote an overlap between groups a and b, indicating that DNA yields in these samples are not significantly different from either group a or group b, while groups a and b are significantly different from each other.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-13-1769457-g007.tif">
<alt-text content-type="machine-generated">Panel a presents a boxplot comparing qubit yield of DNA in nanograms for two filter materials, aPES and MCE, with two filter fractions: Pico greater than 0.22 micrometers and Viral less than 0.22 micrometers; sample sizes for each comparison are indicated and less than 5 micrometer. Panel b shows similar boxplots for a smaller sample size, comparing the same variables, with clear differences in DNA yield between filter materials and fractions.</alt-text>
</graphic></fig>
<fig id="f8" position="float">
<label>Figure&#xa0;8</label>
<caption>
<p>DNA yield before and after extended freezer storage. DNA recovered (measured using a Qubit fluorometer), presented as ng/L <bold>(a)</bold>, and ng <bold>(b)</bold>, with extractions taking place either 5&#x2013;7 days after sampling (left plots within each figure) or 98 days after sampling (right plots within each figure). All data in this plot reflect DNA extracted from filters produced from a single sampling event on 31 July, 2024 extracted using the PowerSoil Kit and otherwise with the same processing methods. All conditions are labelled &#x201c;a&#x201d; indicating that there was only one significance group as denoted by a Tukey&#x2019;s <italic>post hoc</italic> test (p &lt; 0.05) after performing an ANOVA to determine if material and fraction had a significant impact on yield, and n indicates sample size in each plot.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-13-1769457-g008.tif">
<alt-text content-type="machine-generated">Box plot figure containing two panels compares Qubit yield of DNA for two filter fractions, micro (greater than 5 micrometers) and pico (greater than 0.22 micrometers), over two periods in freezer, 5-7 and 98 days. Panel a shows DNA yield in nanograms per liter, and panel b shows yield in nanograms. Both panels have green and teal box plots, statistical annotations, and similar trends, with the legend at the bottom.</alt-text>
</graphic></fig>
<p>In-line serial filtration of the macro and micro fractions onto nylon and MCE membranes, respectively, using the Millipore Sigma polypropylene in-line filter holders (see Methods and <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Data Tables</bold></xref>) was observed to be the fastest method to remove larger-sized organisms, and facilitated large-volume processing in a laboratory while monitoring and changing out 20 &#xb5;m or 5 &#xb5;m filters if flow lessened as they became clogged. We note that for this reason the replicates for the 5 &#xb5;m filters are taken sequentially from the same sample flow through a single 20 &#xb5;m filter, and may differ based on differential coating, clogging, or disruption of the 20 &#xb5;m filter over that time series (see relative read counts section below). In contrast, the single-flask sterile PES filters were observed to be more time-efficient for pico and viral fractions than in-line filtration on an MCE membrane, reducing processing time per liter from over an hour to a matter of minutes in some cases. The larger (90 mm) filter size also allowed collection of quality technical replicates of DNA extraction and sequencing by cutting PES filters into equal fractions prior to freezing. A list of all yield data for samples used in these analyses can be found in <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Data 3</bold></xref>.</p>
</sec>
<sec id="s3_4">
<title>Shotgun sequencing and relative read counts assigned to taxon groups</title>
<p>Read mapping results for four sites (PNNL-Sequim, John Wayne Marina, Cline Spit, and Discovery Bay) show that amoeba read counts were dramatically reduced between 3- and 30-fold after passage through 5 &#xb5;m to 0.22 &#xb5;m filters (<xref ref-type="fig" rid="f9"><bold>Figure&#xa0;9</bold></xref>), with the greatest fold reduction from the highest count 5 &#xb5;m filter (John Wayne Marina) and the least fold reduction from the lowest count 5 &#xb5;m filter (Cline Spit). In the Cline Spit sequences, there were only 287 reads from the 5 &#xb5;m filter that matched amoeba sequences. Although this indicates that large-bodied cells are effectively screened out, relative <italic>Prochlorococcus</italic> reads were not substantially increased or decreased in any of the 0.22 &#xb5;m filter samples, while relative <italic>Synechococcus</italic> reads were substantially reduced in some 0.22 &#xb5;m filter samples by up to a third (<xref ref-type="fig" rid="f9"><bold>Figure&#xa0;9</bold></xref>; <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Data 1</bold></xref>). <italic>Prochlorococcus</italic> normalized read counts were similar across sites and filters (range 718&#x2013;1300 per 10 M reads), indicating that substantial numbers are trapped by the larger filters and possibly that the differential filtering of larger cells is not enough to increase the relative enrichment of small cells on the subsequent filter; other possibilities are discussed below. The coefficient of variation among <italic>Prochlorococcus</italic> mean<italic>-</italic>normalized read counts for the <xref ref-type="fig" rid="f9"><bold>Figure&#xa0;9</bold></xref> technical replicates (replicates of all steps from filtration onwards) on the 0.22 &#xb5;m filters was also small at 6.8% (7.5%, 8.8%, and 5.0% for data in <xref ref-type="fig" rid="f9"><bold>Figures&#xa0;9a-c</bold></xref>, respectively). The <italic>Synechococcus</italic> read counts were also similar across samples and showed slightly higher reads than those of <italic>Prochlorococcus</italic> with the exception of Discovery Bay, in which the <italic>Synechococcus</italic> read counts were approximately 10-fold higher than at Cline Spit (<xref ref-type="fig" rid="f9"><bold>Figures&#xa0;9c, d</bold></xref>). The amoeba reads from the 5 &#xb5;m filters at Cline Spit and Discovery Bay, were about 50%-100% greater than <italic>Synechococcus</italic> reads at PNNL-Sequim and John Wayne Marina. The number of reads mapping to amoeba and <italic>Synechococcus</italic> fluctuate much more than reads mapping to <italic>Prochlorococcus</italic>, but they are not in sync with each other across sites. It is also notable that the 24-mer nonpareil sequence diversity measures across all sites (<xref ref-type="fig" rid="f9"><bold>Figure&#xa0;9e</bold></xref>) were consistently higher and more variable in the 5 &#xb5;m filter fractions (range ~20.5-22.5) than the 0.22 &#xb5;m filter fractions (range ~19.5-20). The 5 &#xb5;m filters are thus at levels that are comparable to marine and soil samples (21-25) or freshwater and sandy soils (20-22) (<xref ref-type="bibr" rid="B44">Rodriguez-R et&#xa0;al., 2018</xref>), while the 0.22 &#xb5;m diversity is comparatively reduced.</p>
<fig id="f9" position="float">
<label>Figure&#xa0;9</label>
<caption>
<p>Taxon assignments and sequence diversity measures across sampling locations. Sampling occurred in mid-late Summer 2024 at four sites <bold>(a)</bold> PNNL-Sequim 23 July 2024; <bold>(b)</bold> John Wayne Marina 31 July 2024; <bold>(c)</bold> Cline Spit 7 August 2024; and <bold>(d)</bold> Discovery Bay 14 August 2024. <bold>(e)</bold> Nonpareil 24-mer diversity measures (log scale) of the same samples shown in a-d, color-coded by site and sampling date as indicated in legend.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-13-1769457-g009.tif">
<alt-text content-type="machine-generated">Five-panel scientific figure. Panels a-d display boxplots of Amoeba, Prochlorococcus, and Synechococcus read counts (per million) across filter fractions for dates 2024-07-23, 2024-07-31, 2024-08-07, and 2024-08-14. Panel e presents a scatter plot showing diversity against filter fraction, color-coded by date.</alt-text>
</graphic></fig>
<p><italic>Synechococcus</italic> read counts were remarkably similar at ebb and flood tides for both the 5 &#xb5;m and 0.22 &#xb5;m filters (<xref ref-type="fig" rid="f10"><bold>Figure&#xa0;10</bold></xref>). In contrast, amoeba reads were about 3x less frequent at flood versus ebb tide on the 5 &#xb5;m filter and greatly reduced in frequency on the 0.22 &#xb5;m filters (<xref ref-type="fig" rid="f10"><bold>Figure&#xa0;10</bold></xref>). <italic>Prochlorococcus</italic> reads were also reduced in flood versus ebb tides and were reduced by 50%-60% on the 0.22 &#xb5;m filter compared to the 5 &#xb5;m filter. We note that the flood tide samples were extracted considerably later than the ebb stage samples, but time stored in freezer prior to extraction was not expected to change relative frequencies based on our exploratory analysis showing no significant impact of freeze-time on yield (<xref ref-type="fig" rid="f8"><bold>Figure&#xa0;8</bold></xref>).</p>
<fig id="f10" position="float">
<label>Figure&#xa0;10</label>
<caption>
<p>Taxon assignments of same-day samples collected at PNNL- PNNL at Ebb and Flood tides. All samples were collected on 31 July 2024 at dawn or midday (ebb and flood tides, respectively), filtered with 5 and 0.22 &#xb5;m MCE membrane filters and extracted with Qiagen PowerSoil kits. For readability, the magnitudes of the scales differ between the two filter pore sizes, with 5.0 &#xb5;m scale max 8000 reads per million and 0.22 &#xb5;m scale max 1500 reads per million. All conditions with multiple points are technical replicates of the process from sample collection and filtration through DNA extraction and sequencing process.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-13-1769457-g010.tif">
<alt-text content-type="machine-generated">Panel a shows dot plots for Amoeba, Prochlorococcus, and Synechococcus with higher read counts during ebb for Amoeba and lower variation for others at 5 micrometers. Panel b shows box plots and dots for the same taxa, with generally lower read counts at 0.22 micrometers and distinct patterns between ebb and flood stages for each group. All graphs display reads per million versus tidal stage.</alt-text>
</graphic></fig>
<p>Relative frequencies of microbial taxa on the 0.22 &#xb5;m filters over time at PNNL-Sequim, which lasted from mid-April to late October 2024, are shown in <xref ref-type="fig" rid="f11"><bold>Figure&#xa0;11</bold></xref>. These comparisons unavoidably included variation in tidal stage, and also in extraction method and time between collection and extraction, and are across a single year (see <xref ref-type="fig" rid="f11"><bold>Figure&#xa0;11</bold></xref> legend), so must be interpreted in that context. As in previous figures, the amoeba reads are generally low, indicating relative exclusion by the 5 &#xb5;m filter. Amoeba and <italic>Prochlorococcus</italic> reads had high relative frequencies in early spring and late fall, indicating that they were relatively more frequent than other organisms in the filter sample). In contrast, <italic>Synechococcus</italic> counts were higher from April to October, with the exception of counts in July. Counts on July 17, 2024 were clustered by processing conditions for all three taxon groups, indicating that the combination of kit and time in freezer prior to extraction can affect results at nearly the same level of variation as change over time (PSK kit and short time in freezer had much higher counts). September 9, 2024 amoeba samples were strongly clustered by condition, with high relative counts for all samples with a short freezer storage duration and extracted with the PWK kit (the <italic>Prochlorococcus</italic> samples were also clustered in the same fashion). Across all three plots, DNA samples extracted within a few days of filtration had consistently clustered higher counts than samples extracted greater than 50 days after filtration (stored frozen and thawed). This suggests that extended freezer time may contribute to decreased identifiable sequence reads, yet our focused comparisons to assess the impact of freezer storage duration on DNA yield found no significant effect (<xref ref-type="fig" rid="f8"><bold>Figure&#xa0;8</bold></xref>).</p>
<fig id="f11" position="float">
<label>Figure&#xa0;11</label>
<caption>
<p>Diversity reads (per million) over six months in 2024 for all pico fraction samples from the PNNL-Sequim floating dock. PNNL-Sequim dock samples included samples from multiple sampling events, methods, kits, and dates over the year. 8 distinct sampling events on 8 different days are captured in this figure: April 15 (n = 2 DNA samples extracted with PSK 3 days after filtration), May 8 (n = 3 DNA samples extracted using PSK 5 days after filtration), July 17 (n = 4 DNA samples; 2 extracted using PSK 1 day after filtration, and 2 extracted using PWK 124 days after filtration), July 23 (n = 5 samples extracted using PSK 13 days after filtration), July 31 (n = 4 DNA samples extracted using PSK 5 days after filtration), August 26 (n = 1 DNA sample extracted using PWK 9 days after filtration), September 9 (n = 6 DNA samples; 3 extracted using PWK 2 days after sampling, and 3 extracted using PSK 58 days after filtration), and October 29, 2024 (n = 1 DNA sample extracted using PSK 8 days after sampling).</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-13-1769457-g011.tif">
<alt-text content-type="machine-generated">Box plot graphic showing reads per million for Amoeba, Prochlorococcus, and Synechococcus in Sequim Bay throughout 2024, separated by tidal stages: ebb, flood, and slack high, with higher variability seen in some slack high and flood samples.</alt-text>
</graphic></fig>
</sec>
</sec>
<sec id="s4" sec-type="discussion">
<title>Discussion</title>
<p>In this paper, we present and test the efficacy of a sampling approach to enrich taxonomic fractions by size exclusion filtration prior to targeted metagenomic shotgun sequencing. Our prior expectation was that organisms with cell sizes in the given size range would be enriched in the corresponding filter fraction, but that results would vary due to variable filter performance, variable cell-cell and cell-particle attachment frequencies among organisms, cell-free DNA, and horizontal gene transfer, especially involving viral particles. We define our sample fractions as macro (greater than 20 um), micro (5 to 20 um), pico (aka small micro, 0.2 to 5 um), and viral (less than 0.2 um), and sampling occurred in conjunction with abiotic metadata collection from the environment. Our final methodology balances material recovery, filter type and size, and collection speed. It incorporates a multi-step process: inline serial filtration through a combination of filters with sequentially smaller pore sizes, followed by single-flask filtration to capture various target organism size classes, followed by precipitation of viral particles in the filtrate from the smallest 0.22 &#xb5;m filters, which are expected to screen out nearly all intact cells. The final filter types were 20 &#xb5;m Millipore nylon filters, 5 &#xb5;m Millipore MCE membrane filters, and 0.22 &#xb5;m PES filters. By increasing the filter volume processed when there was little visible biological material, we successfully produced &#x2265; 50 ng of DNA in the majority of extractions, our minimal cutoff for sequencing submission. This required extensive filtration processing time of up to 3 hours for a single filter in some cases with higher biomass levels. All kit and filter types tested yielded sufficient DNA quantity and quality, and the more critical factors were processing time, cost, and material availability. While this protocol is advantageous for time-efficiency, material and equipment cost, and versatility in target organisms, other established methods such as eDNA sampling, culturing, and dilution to extinction may be better suited or used in conjunction with this protocol for applications that require axenic isolates, small samples, long-term cultivated strains, and/or if in-depth sequencing is not required.</p>
<p>The sequencing results presented in this paper were focused on exploratory (many conditions had small numbers or no replicates) statistical analysis to demonstrate detection of the picocyanobacteria genera <italic>Prochlorococcus</italic> and <italic>Synechococcus</italic>, the times of year they were detectable, whether we could enrich the number of reads for these genera in the pico fractions, the technical repeatability of the results, and whether we could detect enrichment for sequences homologous to viruses that might be associated with picocyanobacteria in viral precipitate fractions. The clearest and perhaps most important sequencing result was that both <italic>Prochlorococcus</italic> and <italic>Synechococcus</italic> were detected in the Salish Sea samples, usually but not always with similar counts between them. <italic>Synechococcus</italic> was generally more common, especially in Discovery Bay which had dramatically higher <italic>Synechococcus</italic> counts per million. Detection of picocyanobacteria sequences is important because extraction of high-quality DNA from picocyanobacteria remains challenging primarily due to relatively low biomass collected in competitive and low-nutrient (oligotrophic) marine water (<xref ref-type="bibr" rid="B55">Wagner et&#xa0;al., 2024</xref>; <xref ref-type="bibr" rid="B21">Hept and Greene, 2023</xref>). Complicated by their potential inability to contribute proportionally as much to biomass in the more competitive and nutrient-rich estuarine waters of the Salish Sea. The relatively constant ratio of sequences from the two genera across sites and over the year is also important because of possible temperature, nutrient level, and virus interaction effects that at this latitude could have strongly affected their relative distributions (<xref ref-type="bibr" rid="B8">Carlson et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B9">Coello-Camba and Agust&#xed;, 2024</xref>; <xref ref-type="bibr" rid="B60">Zhang et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B62">Zufia et&#xa0;al., 2022</xref>). The validation of picocyanobacterial relative type abundance was essential because while some studies determined that picocyanobacteria are found in all regions of the euphotic zone, there is little research to validate these findings in the northern Pacific Ocean and specifically in the Salish Sea (<xref ref-type="bibr" rid="B2">Babi&#x107; et&#xa0;al., 2017</xref>). It is also notable, and important to establish, that the technical replicability (from filtering onwards) of the relative <italic>Prochlorococcus</italic> counts on the 0.22 &#xb5;m filters was high (<xref ref-type="fig" rid="f9"><bold>Figure&#xa0;9</bold></xref> and throughout), allowing preliminary confidence in results differing by 10% or higher.</p>
<p>We note that although one viral sample had anomalously low counts, the top 5 viral samples have only 3.5x higher relative read counts (average 3417) than the remainder of the samples (average 882), indicating that a substantial amount of viral DNA is retained with the large-sized fractions. This may be due to particles or free DNA sticking to the filters, or to incorporation/infection or attachment to the cells that are stuck on those filters. We also note that phages derived from <italic>Synechococcus</italic> were the best matches to slightly over 50% of the cyanophage reads, although we caution against over-interpreting this result in terms of what types of organisms are infected with cyanophage, both because phages can often infect multiple species, and because the reference dataset contains many more <italic>Synechococcus</italic>-derived phages than cyanophages isolated from other organisms. Nevertheless, it is interesting that some of the highest read counts observed for <italic>Synechococcus</italic>-derived phages (2698, 2696, and 1240 respectively on the 20, 5 and 0.22 &#xb5;m filters from August 14, 2024 at Discovery Bay) were from samples with some of the highest <italic>Synechococcus</italic> genome read counts (respectively 15,251, 9653, and 7989).</p>
<p>Salinity and water temperature followed similar trends to each other, with slight increases during summer months and lows during cooler seasons. The slight changes in salinity across seasons are likely due to the heavy influence of rivers and precipitation in the estuary system, with increased outflow and precipitation in colder months that decrease salinity (<xref ref-type="bibr" rid="B56">Walker et&#xa0;al., 2022</xref>). Cline Spit&#x2019;s increased water temperature compared to PNNL-Sequim may be influenced by its location within Dungeness Bay, which is protected by a long spit that reduces water volume exchange and creates shallower sites. There are also large variances in the distance from the shore between sampling sites, which may inform differences between samples (e.g. sampling less than one meter from shore at Cline Spit, and greater than 50 meters from shore near Port Townsend).</p>
<p>The trends in relative frequencies of <italic>Prochlorococcus</italic>, <italic>Synechococcus</italic>, and amoeba-like sequences over the course of the year at PNNL Sequim (<xref ref-type="fig" rid="f11"><bold>Figure&#xa0;11</bold></xref>) were somewhat surprising. Although the numbers were small, relative numbers of <italic>Prochlorococcus</italic> were highest towards the beginning of the year and decreased throughout the year, while <italic>Synechococcus</italic> numbers were lowest early in the year and then relatively constant. One might have thought that <italic>Prochlorococcus</italic>, which dominates at tropical and subtropical altitudes, would do comparatively better in the warmer months. Indeed, the highest counts were expected during the late spring and summer months (<xref ref-type="bibr" rid="B61">Zinser et&#xa0;al., 2006</xref>), so this may indicate that the estuarine dynamics of an inland sea are more unpredictable than expected. This trend was visible despite differences in tidal stage at time of sampling (which also impact relative counts, <xref ref-type="fig" rid="f10"><bold>Figure&#xa0;10</bold></xref>). The trends in relative amoeba-like read counts (we remind readers that with only one amoeba sequence included, the phylogenetic definition of these sequences is poor) did not correspond to either of the picocyanobacteria, being most common in the earliest and latest months of the year sampled. Further definition of these trends will await results from planned sampling and sequencing across 2025 and 2026, and will particularly benefit from more detailed analysis of the relative frequency of sub-lineages within these broad taxonomic groups (i.e. at the species or ecotype level or below).</p>
<p>The relative read counts of various taxa under different filtration conditions were also unexpected. The amoeba-like sequences were more frequent on the 5 &#xb5;m filters than the 0.22 &#xb5;m filters, and combined with the relatively high nonpareil diversity on the 5 &#xb5;m filters, this indicated that the size exclusion filtration was effective. However, <italic>Prochlorococcus</italic> and <italic>Synechococcus</italic> relative read counts were not comparatively higher on the 0.22 &#xb5;m filters, and were fairly frequent in the viral fraction, which passed through the 0.22 &#xb5;m filters. Given these results, we may have been overly conservative in using 5 &#xb5;m filters (rather than, say, 2 &#xb5;m filters) to screen out large-bodied cells, but it also appears that considerable amounts of picocyanobacterial DNA both accumulated on the larger filters and passed through the smaller filters. Although free DNA and inadequacies of the filtration process need to be considered (e.g., high variability in pore size, micro breaks in filters, DNA or cell binding to filters as they pass through), it is possible that there are alternative explanations. Tycheposons, which are numerically common DNA-containing particles from <italic>Prochlorococcus</italic>, are emitted into the environment as particles similar to viruses (<xref ref-type="bibr" rid="B20">Hackl et&#xa0;al., 2023</xref>). These and other undiscovered elements in the taxa under study may strongly impact the filtration properties of DNA-containing objects. Higher-level conglomerates of cells or cell-particle mixes are now also recognized as important features of both <italic>Prochlorococcus</italic> and <italic>Synechococcus</italic>, which would contribute to their retention on larger pore-size filters. Furthermore, viruses are commonly retained with infected cells, and due to gene transfer mechanisms both viruses and host targets can contain each other&#x2019;s genes. These sequencing features will also strongly benefit from more detailed analysis of the relative frequency of sub-lineages within these broad taxonomic groups, as well as detailed analysis of genomic regions that may be under- or over-sampled in different filter partitions.</p>
<sec id="s4_1">
<title>Technical challenges</title>
<p>The extraction of high-quality DNA from picocyanobacteria remains challenging, likely due to relatively low biomass collected in oligotrophic marine water, and potentially due to environmental contaminants, cell lysis inefficiencies due to cyanobacterial extracellular polymeric substances, and polysaccharide production (<xref ref-type="bibr" rid="B55">Wagner et&#xa0;al., 2024</xref>). Additionally, the consistently low biomass found at sampling sites&#x2014;excluding Cline Spit, which had much higher biological material than the other sampling sites&#x2014;necessitated high filtration volumes and extensive processing time.</p>
<p>The low sample size for many compared groups was a challenge to use for analyses and must be interpreted with caution. While ANOVA requires a minimum of one sample above the number of groups and can technically be performed under these conditions, it is not considered a sufficient sample size for statistical conclusions. We recognize that these results are only exploratory analyses to guide further research with larger sample sizes.</p>
<p>For our preliminary estimates, we used limited high-level estimates of sequence composition, and small numbers of technical replicates from identical samples (same time, location, and water sample with same filtration protocol). We also had few replicates of biological/environmental effects such as tidal state, time of year, or sampling location. Due to continuous sampling methodology adaptations throughout year one, there was high variation in sample production, which significantly decreased the number of quality technical replicates for focused comparisons. Especially for the non-controlled comparisons, results should be&#xa0;validated with larger sample sets and using consistent methods;&#xa0;however, the results presented here provide a valuable understanding of the impact that methodological variation can have.</p>
</sec>
</sec>
<sec id="s6" sec-type="conclusions">
<title>Conclusions</title>
<p>To address a gap of relatively rapid methods for isolating multiple target microorganisms from aqueous environments, we explored methods for consistent size-fractionated sampling and metadata collection. While this work was completed to support host-virus interaction studies influenced by environmental factors and to provide shareable, high-quality metadata for diverse applications, this work may also be useful in environmental DNA pre-filtration, ecosystem health monitoring, phytoplankton carbon cycling, harmful algal bloom detection, water quality assessments, metagenomics, single-cell genomics, aquaculture, algal anti-viral research, and fisheries management. By analyzing community composition, species, and ecotypes at the community level, as well as variations in host and phage genes, protein structures, and interactomes at the molecular level, this approach may inform phage-host co-evolution and viral-host interactions while reducing sequencing noise. This refined sampling and metadata production method for downstream analyses may also be useful in environmental DNA pre-filtration, ecosystem health monitoring, phytoplankton carbon cycling, harmful algal bloom detection, water quality assessments, metagenomics, single-cell genomics, aquaculture, algal anti-viral research, and fisheries management.</p>
<p>Using this refined sampling and metadata production method for downstream analyses, we were able to successfully produce sufficient DNA from multiple filter fractions to conduct preliminary metagenomic analyses in conjunction with environmental context over approximately a year. The processing time to produce four filter fractions for up to 60 liters of raw sample was reduced to as little as three hours in some cases, though processing time did increase with samples containing relatively high levels of biomass. While purifying enough DNA from marine aqueous environments for metagenomic applications is challenging, we were able to produce sufficient yields in all filter fractions, averaging 450, 1210, 1272, and 924 ng for the viral, pico, micro, and macro fractions. These results allowed us to conduct preliminary metagenomic analyses to investigate picocyanobacterial and viral dynamics in the Salish Sea.</p>
<p>In future work, more data should be collected using the final sampling scheme to generate larger sample sizes for more robust comparisons. This will produce valuable, standardized biological and physiochemical datasets to feed in-depth research applications such as evolutionary modeling of virus-host interactions. In addition, varying filter sizes may be helpful in refining the isolation and retention of target species in each fraction.</p>
<p>Finally, we considered additional experimental approaches to obtain more data on genetic aspects of the metagenomic samples, including RNA extraction and sequencing, individual cell and/or phage isolation and amplification in culture, and single cell sequencing, but concluded that these were not within our current budgetary constraints. These approaches would likely require further testing and modification of the protocol used to collect samples. Single cell sequencing or cell monoculture sequencing would likely have a tradeoff of fewer organisms sampled (leading to lower genetic diversity in sequencing results) for much better linkage information along the genome, while RNA sequencing in particular would reflect functional activity rather than just the presence of organisms measured in DNA sequencing. In future experiments with sufficient funding, adding these or similar types of approaches would be highly beneficial to better understand host-pathogen relationships, the ultimate aim of our research project.</p>
</sec>
</body>
<back>
<sec id="s7" sec-type="data-availability">
<title>Data availability statement</title>
<p>The datasets presented in this study can be found in online repositories. The names of the repository/repositories and accession number(s) can be found in the article/<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material</bold></xref>.</p></sec>
<sec id="s8" sec-type="author-contributions">
<title>Author contributions</title>
<p>NB: Validation, Data curation, Resources, Visualization, Conceptualization, Methodology, Writing &#x2013; review &amp; editing, Supervision, Investigation, Formal analysis, Writing &#x2013; original draft. OL: Conceptualization, Writing &#x2013; review &amp; editing, Methodology, Data curation, Supervision. KJ: Data curation, Methodology, Investigation, Writing &#x2013; review &amp; editing. MP-F: Investigation, Methodology, Writing &#x2013; original draft, Data curation. DL: Software, Writing &#x2013; review &amp; editing, Visualization, Formal analysis. SC-T: Data curation, Methodology, Visualization, Formal&#xa0;analysis, Investigation, Writing &#x2013; original draft. PR: Formal analysis, Methodology, Visualization, Data curation, Writing &#x2013; review &amp; editing, Writing &#x2013; original draft, Software. RW: Data curation, Formal analysis, Writing &#x2013; original draft. CP: Writing &#x2013; review &amp; editing, Software, Visualization. MC: Project administration, Funding acquisition, Writing &#x2013; review &amp; editing, Supervision, Resources. CJ: Visualization, Writing &#x2013; review &amp; editing, Investigation, Project administration, Supervision, Formal analysis, Writing &#x2013; original draft, Data curation, Software. SE: Writing &#x2013; original draft, Resources, Writing &#x2013; review &amp; editing, Supervision, Methodology, Conceptualization. DP: Project administration, Conceptualization, Resources, Writing &#x2013; original draft, Formal analysis, Funding acquisition, Supervision, Writing &#x2013; review &amp; editing, Investigation.</p></sec>
<sec id="s10" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The author(s) declared that this work was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p></sec>
<sec id="s11" sec-type="ai-statement">
<title>Generative AI statement</title>
<p>The author(s) declared that generative AI was not used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p></sec>
<sec id="s12" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p></sec>
<sec id="s13" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fmars.2026.1769457/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fmars.2026.1769457/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Table1.xlsx" id="SF1" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"><label>Supplementary Table&#xa0;1</label>
<caption>
<p>Peristaltic and Vacuum Pumps used in sampling method iteration.</p>
</caption></supplementary-material>
<supplementary-material xlink:href="Table2.xlsx" id="SF2" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"><label>Supplementary Table&#xa0;2</label>
<caption>
<p>Filter types tested for serial filtration optimization.</p>
</caption></supplementary-material>
<supplementary-material xlink:href="Table3.xlsx" id="SF3" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"><label>Supplementary Table&#xa0;3</label>
<caption>
<p>In-line filter holders tested for serial filtration optimization.</p>
</caption></supplementary-material>
<supplementary-material xlink:href="Table4.xlsx" id="SF4" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"><label>Supplementary Table&#xa0;4</label>
<caption>
<p>DNA Extraction kits used to test filter subsample DNA extraction optimization.</p>
</caption></supplementary-material>
<supplementary-material xlink:href="Table5.xlsx" id="SF5" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"><label>Supplementary Table&#xa0;5</label>
<caption>
<p>Environmental metadata: acquisition methods distinguished by data acquired from MCRL Data at PNNL-Sequim or other locations.</p>
</caption></supplementary-material>
<supplementary-material xlink:href="Image1.jpg" id="SF6" mimetype="image/jpeg"><label>Supplementary Figure&#xa0;1</label>
<caption>
<p>TapeStation Data: DNA fragment analysis of 6 pico fraction samples and 1 viral fraction sample from parent sample NW_FE_024, sampled from Sequim Bay during a slack tide in September of 2024.</p>
</caption></supplementary-material>
<supplementary-material xlink:href="Image2.png" id="SF7" mimetype="image/png"><label>Supplementary Figure&#xa0;2</label>
<caption>
<p>Read alignment comparison for different cyanobacteria databases. The plots show good agreement between reads mapped using the NCBI-derived references used in the main manuscript and Prochlorococcus and Synechococcus references derived from the Cyanorak database. Each data point represents all sequences from a metagenomic sample. Red dashed line is the line y=x.</p>
</caption></supplementary-material>
<supplementary-material xlink:href="Image3.png" id="SF8" mimetype="image/png"><label>Supplementary Figure&#xa0;3</label>
<caption>
<p>Reads aligned to macroscopic reference strains across sample sequences. A range of reference strains demonstrate similar qualitative filtering behaviors across the sampling events, where the x-axis represents the sample sequences and y-axis the map read counts (per million). Amoeba (Chromosomes) and several marine diatoms common in the Salish Sea were chosen as a macroscopic reference for filter comparisons. Specific diatom strains considered were Skeletonema costatum strain CNS00243 (GCA_046619385.1), Chaetoceros tenuissimus strain NIES-3715 (GCA_021927905.1), Chaetoceros muelleri strain CCMP1316 (GCA_019693545.1), Thalassiosira oceanica strain CCMP1005 (GCA_019693575.1), Thalassiosira pacifica strain AJA261-08 (GCA_036939875.1).</p>
</caption></supplementary-material>
<supplementary-material xlink:href="DataSheet1.xlsx" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/>
<supplementary-material xlink:href="DataSheet2.xlsx" id="SM2" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/>
<supplementary-material xlink:href="DataSheet3.xlsx" id="SM3" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/>
<supplementary-material xlink:href="DataSheet4.xlsx" id="SM4" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/></sec>
<ref-list>
<title>References</title>
<ref id="B1">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Adams</surname> <given-names>C. I. M.</given-names></name>
<name><surname>Knapp</surname> <given-names>M.</given-names></name>
<name><surname>Gemmell</surname> <given-names>N. J.</given-names></name>
<name><surname>Jeunen</surname> <given-names>G. J.</given-names></name>
<name><surname>Bunce</surname> <given-names>M.</given-names></name>
<name><surname>Lamare</surname> <given-names>M. D.</given-names></name>
<etal/>
</person-group>. (<year>2019</year>). 
<article-title>Beyond biodiversity: can environmental DNA (eDNA) cut it as a population genetics tool</article-title>? <source>Genes</source> <volume>10</volume>, <elocation-id>192</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/genes10030192</pub-id>, PMID: <pub-id pub-id-type="pmid">30832286</pub-id>
</mixed-citation>
</ref>
<ref id="B2">
<mixed-citation publication-type="book">
<person-group person-group-type="author">
<name><surname>Babi&#x107;</surname> <given-names>I.</given-names></name>
<name><surname>Petri&#x107;</surname> <given-names>I.</given-names></name>
<name><surname>Bosak</surname> <given-names>Sun&#x10d;ica</given-names></name>
<name><surname>Mihanovi&#x107;</surname> <given-names>H.</given-names></name>
<name><surname>Radi&#x107;</surname> <given-names>I. Dup&#x10d;i&#x107;</given-names></name>
<name><surname>Ljube&#x161;i&#x107;</surname> <given-names>Z.</given-names></name>
</person-group> (<year>2017</year>). &#x201c;
<article-title>Distribution and Diversity of Marine Picocyanobacteria Community: Targeting of <italic>Prochlorococcus</italic> Ecotypes in Winter Conditions (Southern Adriatic Sea)</article-title>,&#x201d; in <source>Marine Genomics, Navigating the Future: Cross-sector Marine Genomics</source>, <publisher-loc>(Amsterdam, Netherlands</publisher-loc>: 
<publisher-name>Elsevier</publisher-name>), vol. <volume>36</volume>, <fpage>3</fpage>&#x2013;<lpage>11</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.margen.2017.05.014</pub-id>, PMID: <pub-id pub-id-type="pmid">28595872</pub-id>
</mixed-citation>
</ref>
<ref id="B3">
<mixed-citation publication-type="web">
<person-group person-group-type="author"><collab>Babraham Institute</collab>
</person-group> (<year>2023</year>). <source>Babraham Bioinformatics - FastQC A Quality Control Tool for High Throughput Sequence Data</source>. Available online at: <uri xlink:href="https://www.bioinformatics.babraham.ac.uk/projects/fastqc/">https://www.bioinformatics.babraham.ac.uk/projects/fastqc/</uri> (Accessed <date-in-citation content-type="access-date">November 5, 2025</date-in-citation>).
</mixed-citation>
</ref>
<ref id="B4">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Buchholz</surname> <given-names>H. H.</given-names></name>
<name><surname>Michelsen</surname> <given-names>M. L.</given-names></name>
<name><surname>Bola&#xf1;os</surname> <given-names>L. M.</given-names></name>
<name><surname>Browne</surname> <given-names>E.</given-names></name>
<name><surname>Allen</surname> <given-names>M. J.</given-names></name>
<name><surname>Temperton</surname> <given-names>B.</given-names></name>
</person-group> (<year>2021</year>). 
<article-title>Efficient Dilution-to-extinction isolation of novel virus&#x2013;host model systems for fastidious heterotrophic Bacteria</article-title>. <source>ISME J.</source> <volume>15</volume>, <fpage>1585</fpage>&#x2013;<lpage>1598</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41396-020-00872-z</pub-id>, PMID: <pub-id pub-id-type="pmid">33495565</pub-id>
</mixed-citation>
</ref>
<ref id="B5">
<mixed-citation publication-type="book">
<person-group person-group-type="author">
<name><surname>Bushnell</surname> <given-names>B.</given-names></name>
</person-group> (<year>2014</year>). &#x201c;
<article-title>BBMap: A Fast, Accurate, Splice-Aware Aligner</article-title>,&#x201d; in <source>LBNL-7065E</source>. <publisher-loc>(Berkeley, California, United States</publisher-loc>: 
<publisher-name>LBL Publications</publisher-name>). Available online at: <uri xlink:href="https://escholarship.org/uc/item/1h3515gn">https://escholarship.org/uc/item/1h3515gn</uri> (Accessed <date-in-citation content-type="access-date">November 20, 2025</date-in-citation>).
</mixed-citation>
</ref>
<ref id="B6">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Bushnell</surname> <given-names>B.</given-names></name>
<name><surname>Rood</surname> <given-names>J.</given-names></name>
<name><surname>Singer</surname> <given-names>E.</given-names></name>
</person-group> (<year>2017</year>). 
<article-title>BBMerge - accurate paired shotgun read merging via overlap</article-title>. <source>PloS One</source> <volume>12</volume>, <fpage>e0185056</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1371/journal.pone.0185056</pub-id>, PMID: <pub-id pub-id-type="pmid">29073143</pub-id>
</mixed-citation>
</ref>
<ref id="B7">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Callieri</surname> <given-names>C.</given-names></name>
<name><surname>Cabello-Yeves</surname> <given-names>P. J.</given-names></name>
<name><surname>Bertoni</surname> <given-names>F.</given-names></name>
</person-group> (<year>2022</year>). 
<article-title>The &#x2018;Dark side&#x2019; of picocyanobacteria: life as we do not know it (Yet)</article-title>. <source>Microorganisms</source> <volume>10</volume>, <elocation-id>546</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/microorganisms10030546</pub-id>, PMID: <pub-id pub-id-type="pmid">35336120</pub-id>
</mixed-citation>
</ref>
<ref id="B8">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Carlson</surname> <given-names>C. J.</given-names></name>
<name><surname>Albery</surname> <given-names>G. F.</given-names></name>
<name><surname>Merow</surname> <given-names>C.</given-names></name>
<name><surname>Trisos</surname> <given-names>C. H.</given-names></name>
<name><surname>Zipfel</surname> <given-names>C. M.</given-names></name>
<name><surname>Eskew</surname> <given-names>E. A.</given-names></name>
<etal/>
</person-group>. (<year>2022</year>). 
<article-title>Climate change increases cross-species viral transmission risk</article-title>. <source>Nature</source> <volume>607</volume>, <fpage>555</fpage>&#x2013;<lpage>562</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41586-022-04788-w</pub-id>, PMID: <pub-id pub-id-type="pmid">35483403</pub-id>
</mixed-citation>
</ref>
<ref id="B9">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Coello-Camba</surname> <given-names>A.</given-names></name>
<name><surname>Agust&#xed;</surname> <given-names>S.</given-names></name>
</person-group> (<year>2024</year>). 
<article-title>Seawater temperature drives the diversity of key cyanobacteria (<italic>Synechococcus</italic> and <italic>Prochlorococcus</italic>) in a warming sea</article-title>. <source>Front. Mar. Sci.</source> <volume>11</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fmars.2024.1456799</pub-id>, PMID: <pub-id pub-id-type="pmid">41717471</pub-id>
</mixed-citation>
</ref>
<ref id="B10">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Del Bel Belluz</surname> <given-names>J.</given-names></name>
<name><surname>Jackson</surname> <given-names>J. M.</given-names></name>
<name><surname>Kellogg</surname> <given-names>C. T.E.</given-names></name>
<name><surname>Pe&#xf1;a</surname> <given-names>M.A.</given-names></name>
<name><surname>Giesbrecht</surname> <given-names>I. J.W.</given-names></name>
<name><surname>Hobson</surname> <given-names>L. A.</given-names></name>
</person-group> (<year>2024</year>). 
<article-title>Phytoplankton community composition links to environmental drivers across a fjord to shelf gradient on the central coast of british columbia</article-title>. <source>Front. Mar. Sci.</source> <volume>11</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fmars.2024.1458677</pub-id>, PMID: <pub-id pub-id-type="pmid">41717471</pub-id>
</mixed-citation>
</ref>
<ref id="B11">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Dorigatti</surname> <given-names>I.</given-names></name>
<name><surname>Gaythorpe</surname> <given-names>K. A.M.</given-names></name>
<name><surname>Cox</surname> <given-names>V. M.</given-names></name>
<name><surname>Windram</surname> <given-names>F. A.</given-names></name>
<name><surname>Cator</surname> <given-names>L.</given-names></name>
</person-group> (<year>2025</year>). 
<article-title>Priorities for modelling arbovirus transmission under climate change</article-title>. <source>Trends Mol. Med.</source> <volume>31</volume>, <fpage>885</fpage>&#x2013;<lpage>894</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.molmed.2025.05.010</pub-id>, PMID: <pub-id pub-id-type="pmid">40527633</pub-id>
</mixed-citation>
</ref>
<ref id="B12">
<mixed-citation publication-type="web">
<person-group person-group-type="author"><collab>EcoKMER GitHub Software Repository</collab>
</person-group> (<year>2025</year>). Available online at: <uri xlink:href="https://github.com/NWBRaVE/EcoKMER">https://github.com/NWBRaVE/EcoKMER</uri> (Accessed <date-in-citation content-type="access-date">October 21, 2025</date-in-citation>).
</mixed-citation>
</ref>
<ref id="B13">
<mixed-citation publication-type="book">
<person-group person-group-type="author">
<name><surname>Edmundson</surname> <given-names>S.</given-names></name>
<name><surname>Huesemann</surname> <given-names>M.</given-names></name>
<name><surname>Cady</surname> <given-names>S.</given-names></name>
<name><surname>Kuo</surname> <given-names>L.-J.</given-names></name>
<name><surname>Anderson</surname> <given-names>B.</given-names></name>
<name><surname>Reynolds</surname> <given-names>D.</given-names></name>
</person-group> (<year>2020</year>). <source>VITAL-viral inhibiTors from ALgae: generating extracts for antiviral activity assays</source>. <publisher-loc>(Alexandria, Virginia, United States</publisher-loc>: 
<publisher-name>National Technical Information Service),</publisher-name> <fpage>1776864</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.2172/1776864</pub-id>
</mixed-citation>
</ref>
<ref id="B14">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Flombaum</surname> <given-names>P.</given-names></name>
<name><surname>Gallegos</surname> <given-names>J. L.</given-names></name>
<name><surname>Gordillo</surname> <given-names>R. A.</given-names></name>
<name><surname>Rincon</surname> <given-names>J.</given-names></name>
<name><surname>Zabala</surname> <given-names>L. L.</given-names></name>
<name><surname>Jiao</surname> <given-names>N.</given-names></name>
<etal/>
</person-group>. (<year>2013</year>). 
<article-title>Present and future global distributions of the marine cyanobacteria <italic>Prochlorococcus</italic> and <italic>Synechococcus</italic></article-title>. <source>Proc. Natl. Acad. Sci. Unit States America</source> <volume>110</volume>, <fpage>9824</fpage>&#x2013;<lpage>9829</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.1307701110</pub-id>, PMID: <pub-id pub-id-type="pmid">23703908</pub-id>
</mixed-citation>
</ref>
<ref id="B15">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Flombaum</surname> <given-names>P.</given-names></name>
<name><surname>Wang</surname> <given-names>W.-L.</given-names></name>
<name><surname>Primeau</surname> <given-names>F. W.</given-names></name>
<name><surname>Martiny</surname> <given-names>A. C.</given-names></name>
</person-group> (<year>2020</year>). 
<article-title>Global picophytoplankton niche partitioning predicts overall positive response to ocean warming</article-title>. <source>Nat. Geosci.</source> <volume>13</volume>, <fpage>116</fpage>&#x2013;<lpage>120</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41561-019-0524-2</pub-id>, PMID: <pub-id pub-id-type="pmid">41714676</pub-id>
</mixed-citation>
</ref>
<ref id="B16">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Fuchsman</surname> <given-names>C. A.</given-names></name>
<name><surname>Hays</surname> <given-names>M. D.</given-names></name>
</person-group> (<year>2023</year>). 
<article-title>Increased cyanophage infection at the bottom of the euphotic zone, especially in the fall</article-title>. <source>Environ. Microbiol.</source> <volume>25</volume>, <fpage>3349</fpage>&#x2013;<lpage>3363</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/1462-2920.16525</pub-id>, PMID: <pub-id pub-id-type="pmid">37861083</pub-id>
</mixed-citation>
</ref>
<ref id="B17">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Garczarek</surname> <given-names>L.</given-names></name>
<name><surname>Guyet</surname> <given-names>U.</given-names></name>
<name><surname>Dor&#xe9;</surname> <given-names>H.</given-names></name>
<name><surname>Farrant</surname> <given-names>G. K.</given-names></name>
<name><surname>Hoebeke</surname> <given-names>M.</given-names></name>
<name><surname>Brillet-Gu&#xe9;guen</surname> <given-names>L.</given-names></name>
<etal/>
</person-group>. (<year>2021</year>). 
<article-title>Cyanorak v2.1: A scalable information system dedicated to the visualization and expert curation of marine and brackish picocyanobacteria genomes</article-title>. <source>Nucleic Acids Res.</source> <volume>49</volume>, <fpage>D667</fpage>&#x2013;<lpage>D676</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/gkaa958</pub-id>, PMID: <pub-id pub-id-type="pmid">33125079</pub-id>
</mixed-citation>
</ref>
<ref id="B18">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>George</surname> <given-names>A.</given-names></name>
<name><surname>Leach</surname> <given-names>D.</given-names></name>
<name><surname>Philips</surname> <given-names>C.</given-names></name>
<name><surname>Brown</surname> <given-names>J.</given-names></name>
<name><surname>Duncan</surname> <given-names>J. M.</given-names></name>
<name><surname>Nedved</surname> <given-names>B.</given-names></name>
<etal/>
</person-group>. (<year>2025</year>). 
<article-title>EcoKMER: one-stop shop for spatio-temporal metagenomic exploration using dataFed</article-title>. <source>bioRxiv</source>. doi:&#xa0;<pub-id pub-id-type="doi">10.64898/2025.12.15.694490</pub-id>, PMID: <pub-id pub-id-type="pmid">41453657</pub-id>
</mixed-citation>
</ref>
<ref id="B19">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Gurevich</surname> <given-names>A.</given-names></name>
<name><surname>Saveliev</surname> <given-names>V.</given-names></name>
<name><surname>Vyahhi</surname> <given-names>N.</given-names></name>
<name><surname>Tesler</surname> <given-names>G.</given-names></name>
</person-group> (<year>2013</year>). 
<article-title>QUAST: quality assessment tool for genome assemblies</article-title>. <source>Bioinf. (Oxf Engl)</source> <volume>29</volume>, <fpage>1072</fpage>&#x2013;<lpage>1075</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/btt086</pub-id>, PMID: <pub-id pub-id-type="pmid">23422339</pub-id>
</mixed-citation>
</ref>
<ref id="B20">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Hackl</surname> <given-names>T.</given-names></name>
<name><surname>Laurenceau</surname> <given-names>R.</given-names></name>
<name><surname>Ankenbrand</surname> <given-names>M. J.</given-names></name>
<name><surname>Bliem</surname> <given-names>C.</given-names></name>
<name><surname>Cariani</surname> <given-names>Z.</given-names></name>
<name><surname>Thomas</surname> <given-names>E.</given-names></name>
<etal/>
</person-group>. (<year>2023</year>). 
<article-title>Novel integrative elements and genomic plasticity in ocean ecosystems</article-title>. <source>Cell</source> <volume>186</volume>, <fpage>47</fpage>&#x2013;<lpage>62.e16</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.cell.2022.12.006</pub-id>, PMID: <pub-id pub-id-type="pmid">36608657</pub-id>
</mixed-citation>
</ref>
<ref id="B21">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Hept</surname> <given-names>M. A.</given-names></name>
<name><surname>Greene</surname> <given-names>L. H.</given-names></name>
</person-group> (<year>2023</year>). 
<article-title>Extracting high-molecular weight DNA from cyanobacteria using promega&#x2019;s wizard&#x24c7; HMW DNA extraction kit with a modified protocol, METIS</article-title>. <source>MethodsX</source> <volume>11</volume>, <elocation-id>102341</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.mex.2023.102341</pub-id>, PMID: <pub-id pub-id-type="pmid">37732290</pub-id>
</mixed-citation>
</ref>
<ref id="B22">
<mixed-citation publication-type="web">
<person-group person-group-type="author">
<name><surname>Hill</surname> <given-names>T.</given-names></name>
<name><surname>cre</surname></name>
<name><surname>Anisfeld</surname> <given-names>S.</given-names></name>
</person-group> (<year>2021</year>). <source>VulnToolkit: analysis of tidal datasets</source>. Available online at: <uri xlink:href="https://cran.r-project.org/web/packages/VulnToolkit/index.html">https://cran.r-project.org/web/packages/VulnToolkit/index.html</uri> (Accessed <date-in-citation content-type="access-date">November 1, 2025</date-in-citation>).
</mixed-citation>
</ref>
<ref id="B23">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Hshieh</surname> <given-names>K.</given-names></name>
<name><surname>Maloney</surname> <given-names>J. G.</given-names></name>
</person-group> (<year>2025</year>). 
<article-title>Sequencing on the edge: tools and techniques for sequencing low biomass isolates from unicellular eukaryotic parasites and other challenging samples</article-title>. <source>J. Microbiol Methods</source> <volume>237</volume>, <elocation-id>107233</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.mimet.2025.107233</pub-id>, PMID: <pub-id pub-id-type="pmid">40846080</pub-id>
</mixed-citation>
</ref>
<ref id="B24">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Huang</surname> <given-names>Z.</given-names></name>
<name><surname>Fang</surname> <given-names>F.</given-names></name>
<name><surname>Ding</surname> <given-names>L.</given-names></name>
<name><surname>Yu</surname> <given-names>Ke</given-names></name>
<name><surname>Zhang</surname> <given-names>L.</given-names></name>
<name><surname>Lu</surname> <given-names>H.</given-names></name>
</person-group> (<year>2023</year>). 
<article-title>Technological advancements in field investigations of marine microorganisms: from sampling strategies to molecular analyses</article-title>. <source>J. Mar. Sci. Eng.</source> <volume>11</volume>, <elocation-id>1981</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/jmse11101981</pub-id>, PMID: <pub-id pub-id-type="pmid">41700957</pub-id>
</mixed-citation>
</ref>
<ref id="B25">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>John</surname> <given-names>S. G.</given-names></name>
<name><surname>Mendez</surname> <given-names>C. B.</given-names></name>
<name><surname>Deng</surname> <given-names>L.</given-names></name>
<name><surname>Poulos</surname> <given-names>B.</given-names></name>
<name><surname>Kauffman</surname> <given-names>A. K. M.</given-names></name>
<name><surname>Kern</surname> <given-names>S.</given-names></name>
<etal/>
</person-group>. (<year>2011</year>). 
<article-title>A simple and efficient method for concentration of ocean viruses by chemical flocculation</article-title>. <source>Environ. Microbiol. Rep.</source> <volume>3</volume>, <fpage>195</fpage>&#x2013;<lpage>202</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/j.1758-2229.2010.00208.x</pub-id>, PMID: <pub-id pub-id-type="pmid">21572525</pub-id>
</mixed-citation>
</ref>
<ref id="B26">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Karamati</surname> <given-names>N</given-names></name>
<name><surname>Elnaz</surname></name>
<name><surname>Law</surname> <given-names>I.</given-names></name>
<name><surname>Weese</surname> <given-names>J.S.</given-names></name>
<name><surname>McCarthy</surname> <given-names>D. T.</given-names></name>
<name><surname>Murphy</surname> <given-names>H. M.</given-names></name>
</person-group> (<year>2024</year>). 
<article-title>Passive sampling of microbes in various water sources: A systematic review</article-title>. <source>Water Res.</source> <volume>266</volume>, <elocation-id>122284</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.watres.2024.122284</pub-id>, PMID: <pub-id pub-id-type="pmid">39353231</pub-id>
</mixed-citation>
</ref>
<ref id="B27">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Kearney</surname> <given-names>S. M.</given-names></name>
<name><surname>Coe</surname> <given-names>A.</given-names></name>
<name><surname>Castro</surname> <given-names>K. G.</given-names></name>
<name><surname>Chisholm</surname> <given-names>S. W.</given-names></name>
</person-group> (<year>2022</year>). 
<article-title>Filter plating method for rendering picocyanobacteria cultures free of heterotrophic bacterial contaminants and clonal</article-title>. <source>Front. Microbiol.</source> <volume>13</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fmicb.2022.821803</pub-id>, PMID: <pub-id pub-id-type="pmid">35250937</pub-id>
</mixed-citation>
</ref>
<ref id="B28">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Kent</surname> <given-names>A. G.</given-names></name>
<name><surname>Baer</surname> <given-names>S. E.</given-names></name>
<name><surname>Mouginot</surname> <given-names>C.</given-names></name>
<name><surname>Huang</surname> <given-names>J.</given-names></name>
<name><surname>Larkin</surname> <given-names>A.</given-names></name>
<name><surname>Lomas</surname> <given-names>M. W.</given-names></name>
<etal/>
</person-group>. (<year>2019</year>). 
<article-title>Parallel phylogeography of <italic>Prochlorococcus</italic> and <italic>Synechococcus</italic></article-title>. <source>ISME J.</source> <volume>13</volume>, <fpage>430</fpage>&#x2013;<lpage>441</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41396-018-0287-6</pub-id>, PMID: <pub-id pub-id-type="pmid">30283146</pub-id>
</mixed-citation>
</ref>
<ref id="B29">
<mixed-citation publication-type="book">
<person-group person-group-type="author">
<name><surname>Lawrence</surname> <given-names>J. E.</given-names></name>
<name><surname>Steward</surname> <given-names>G. F.</given-names></name>
</person-group> (<year>2010</year>). &#x201c;
<article-title>Purification of viruses by centrifugation</article-title>,&#x201d; in <source>Manual of aquatic viral ecology</source>. Eds. 
<person-group person-group-type="editor">
<name><surname>Wilhelm</surname> <given-names>S.</given-names></name>
<name><surname>Weinbauer</surname> <given-names>M.</given-names></name>
<name><surname>Suttle</surname> <given-names>C.</given-names></name>
</person-group> (<publisher-loc>Waco, Texas, United States</publisher-loc>: 
<publisher-name>American Society of Limnology and Oceanography</publisher-name>). doi:&#xa0;<pub-id pub-id-type="doi">10.4319/mave.2010.978-0-9845591-0-7.166</pub-id>
</mixed-citation>
</ref>
<ref id="B30">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Li</surname> <given-names>D.</given-names></name>
<name><surname>Liu</surname> <given-names>C.-M.</given-names></name>
<name><surname>Luo</surname> <given-names>R.</given-names></name>
<name><surname>Sadakane</surname> <given-names>K.</given-names></name>
<name><surname>Lam</surname> <given-names>T.-W.</given-names></name>
</person-group> (<year>2015</year>). 
<article-title>MEGAHIT: An Ultra-Fast Single-Node Solution for Large and Complex Metagenomics Assembly via Succinct de Bruijn Graph</article-title>. <source>Bioinf. (Oxf Engl)</source> <volume>31</volume>, <fpage>1674</fpage>&#x2013;<lpage>1676</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/btv033</pub-id>, PMID: <pub-id pub-id-type="pmid">25609793</pub-id>
</mixed-citation>
</ref>
<ref id="B31">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Liu</surname> <given-names>R.</given-names></name>
<name><surname>Liu</surname> <given-names>Y.</given-names></name>
<name><surname>Chen</surname> <given-names>Y.</given-names></name>
<name><surname>Zhan</surname> <given-names>Y.</given-names></name>
<name><surname>Zeng</surname> <given-names>Q.</given-names></name>
</person-group> (<year>2019</year>). 
<article-title>Cyanobacterial viruses exhibit diurnal rhythms during infection</article-title>. <source>Proc. Natl. Acad. Sci. Unit States America</source> <volume>116</volume>, <fpage>14077</fpage>&#x2013;<lpage>14082</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.1819689116</pub-id>, PMID: <pub-id pub-id-type="pmid">31235591</pub-id>
</mixed-citation>
</ref>
<ref id="B32">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Lu</surname> <given-names>J.</given-names></name>
<name><surname>Rincon</surname> <given-names>N.</given-names></name>
<name><surname>Wood</surname> <given-names>D. E.</given-names></name>
<name><surname>Breitwieser</surname> <given-names>F. P.</given-names></name>
<name><surname>Pockrandt</surname> <given-names>C.</given-names></name>
<name><surname>Langmead</surname> <given-names>B.</given-names></name>
<etal/>
</person-group>. (<year>2022</year>). 
<article-title>Metagenome analysis using the kraken software suite</article-title>. <source>Nat. Protoc.</source> <volume>17</volume>, <fpage>2815</fpage>&#x2013;<lpage>2839</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41596-022-00738-y</pub-id>, PMID: <pub-id pub-id-type="pmid">36171387</pub-id>
</mixed-citation>
</ref>
<ref id="B33">
<mixed-citation publication-type="book">
<person-group person-group-type="author"><collab>Marine and Coastal Research Laboratory</collab>
</person-group> (<year>2025</year>). &#x201c;
<article-title>Outdoor Experimental Tanks at PNNL-Sequim</article-title>,&#x201d; in <source>Pacific northwest national laboratory</source>. <publisher-loc>(Richland Washington, United Stated</publisher-loc>: 
<publisher-name>Pacific Northwest National Laboratory</publisher-name>). Available online at: <uri xlink:href="https://www.pnnl.gov/outdoor-experimental-tanks-pnnl-sequim">https://www.pnnl.gov/outdoor-experimental-tanks-pnnl-sequim</uri> (Accessed <date-in-citation content-type="access-date">December 1, 2025</date-in-citation>).
</mixed-citation>
</ref>
<ref id="B34">
<mixed-citation publication-type="web">
<person-group person-group-type="author"><collab>MCRL Data</collab>
</person-group> (<year>2025</year>). <source>Marine and coastal research laboratory data</source>. Available online at: <uri xlink:href="https://mcrldata.pnnl.gov/">https://mcrldata.pnnl.gov/</uri> (Accessed <date-in-citation content-type="access-date">December 1, 2025</date-in-citation>).
</mixed-citation>
</ref>
<ref id="B35">
<mixed-citation publication-type="web">
<person-group person-group-type="author"><collab>MCRLdata Sandbox</collab>
</person-group> (<year>2025</year>a). <source>MCRLData-sandbox CTD</source>. Available online at: <uri xlink:href="https://github.com/MCRLdata-Sandbox/data_prep/blob/main/data/outputs/L1/250815_ctd_water_temp_salinity_L1.csv">https://github.com/MCRLdata-Sandbox/data_prep/blob/main/data/outputs/L1/250815_ctd_water_temp_salinity_L1.csv</uri> (Accessed <date-in-citation content-type="access-date">December 1, 2025</date-in-citation>).
</mixed-citation>
</ref>
<ref id="B36">
<mixed-citation publication-type="web">
<person-group person-group-type="author"><collab>MCRLdata Sandbox</collab>
</person-group> (<year>2025</year>b). <source>MCRLdata-sandbox tide gauge</source>. Available online at: <uri xlink:href="https://github.com/MCRLdata-Sandbox/data_prep/blob/main/data/outputs/L1/250515_tidegauge_L1.csv">https://github.com/MCRLdata-Sandbox/data_prep/blob/main/data/outputs/L1/250515_tidegauge_L1.csv</uri> (Accessed <date-in-citation content-type="access-date">December 1, 2025</date-in-citation>).
</mixed-citation>
</ref>
<ref id="B37">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Mehdizadeh Allaf</surname> <given-names>M.</given-names></name>
<name><surname>Peerhossaini</surname> <given-names>H.</given-names></name>
</person-group> (<year>2022</year>). 
<article-title>Cyanobacteria: model microorganisms and beyond</article-title>. <source>Microorganisms</source> <volume>10</volume>, <elocation-id>696</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/microorganisms10040696</pub-id>, PMID: <pub-id pub-id-type="pmid">35456747</pub-id>
</mixed-citation>
</ref>
<ref id="B38">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Mella-Flores</surname> <given-names>D. M.</given-names></name>
<name><surname>Six</surname> <given-names>C.</given-names></name>
<name><surname>Ratin</surname> <given-names>M.</given-names></name>
<name><surname>Partensky</surname> <given-names>F.</given-names></name>
<name><surname>Boutte</surname> <given-names>C.</given-names></name>
<name><surname>Le Corguill&#xe9;</surname> <given-names>G.</given-names></name>
<etal/>
</person-group>. (<year>2012</year>). 
<article-title><italic>Prochlorococcus</italic> and <italic>Synechococcus</italic> have evolved different adaptive mechanisms to cope with light and UV stress</article-title>. <source>Front. Microbiol.</source> <volume>3</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fmicb.2012.00285</pub-id>, PMID: <pub-id pub-id-type="pmid">23024637</pub-id>
</mixed-citation>
</ref>
<ref id="B39">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Mioduchowska</surname> <given-names>M.</given-names></name>
<name><surname>Paw&#x142;owska</surname> <given-names>J.</given-names></name>
<name><surname>Mazanowski</surname> <given-names>K.</given-names></name>
<name><surname>Weydmann-Zwolicka</surname> <given-names>A.</given-names></name>
</person-group> (<year>2023</year>). 
<article-title>Contrasting marine microbial communities of the fram strait with the first confirmed record of cyanobacteria <italic>Prochlorococcus marinus</italic> in the arctic region</article-title>. <source>Biology</source> <volume>12</volume>, <elocation-id>1246</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/biology12091246</pub-id>, PMID: <pub-id pub-id-type="pmid">37759645</pub-id>
</mixed-citation>
</ref>
<ref id="B40">
<mixed-citation publication-type="book">
<person-group person-group-type="author"><collab>National Microbiome Data Collaborative</collab>
</person-group> (<year>2026</year>). <source>The NMDC metadata standards documentation</source> (
<publisher-name>Github. Inc: National Microbiome Data Collaborative</publisher-name>). Available online at: <uri xlink:href="https://microbiomedata.github.io/nmdc-schema/Metadata_Documentation_Overview/">https://microbiomedata.github.io/nmdc-schema/Metadata_Documentation_Overview/</uri> (Accessed <date-in-citation content-type="access-date">October 28, 2025</date-in-citation>).
</mixed-citation>
</ref>
<ref id="B41">
<mixed-citation publication-type="book">
<person-group person-group-type="author"><collab>NOAA Tides and Currents</collab>
</person-group> (<year>2025</year>). <source>Port Angeles, WA - Station ID: 9444090, National Oceanic and Atmospheric Administration</source>. Available online at: <uri xlink:href="https://tidesandcurrents.noaa.gov/stationhome.html?id=9444090">https://tidesandcurrents.noaa.gov/stationhome.html?id=9444090</uri> (Accessed <date-in-citation content-type="access-date">August 2025</date-in-citation>).
</mixed-citation>
</ref>
<ref id="B42">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Reynolds</surname> <given-names>D.</given-names></name>
<name><surname>Huesemann</surname> <given-names>M.</given-names></name>
<name><surname>Edmundson</surname> <given-names>S.</given-names></name>
<name><surname>Sims</surname> <given-names>A.</given-names></name>
<name><surname>Hurst</surname> <given-names>B.</given-names></name>
<name><surname>Cady</surname> <given-names>S.</given-names></name>
<etal/>
</person-group>. (<year>2021</year>). 
<article-title>Viral inhibitors derived from macroalgae, microalgae, and cyanobacteria: A review of antiviral potential throughout pathogenesis</article-title>. <source>Algal Res.</source> <volume>57</volume>, <elocation-id>102331</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.algal.2021.102331</pub-id>, PMID: <pub-id pub-id-type="pmid">34026476</pub-id>
</mixed-citation>
</ref>
<ref id="B43">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Ribalet</surname> <given-names>Fran&#xe7;ois</given-names></name>
<name><surname>Dutkiewicz</surname> <given-names>S.</given-names></name>
<name><surname>Monier</surname> <given-names>E.</given-names></name>
<name><surname>Armbrust</surname> <given-names>E.V.</given-names></name>
</person-group> (<year>2025</year>). 
<article-title>Future ocean warming may cause large reductions in <italic>Prochlorococcus</italic> biomass and productivity</article-title>. <source>Nat. Microbiol.</source> <volume>10</volume>, <fpage>2441</fpage>&#x2013;<lpage>2453</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41564-025-02106-4</pub-id>, PMID: <pub-id pub-id-type="pmid">40921743</pub-id>
</mixed-citation>
</ref>
<ref id="B44">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Rodriguez-R</surname> <given-names>L. M.</given-names></name>
<name><surname>Gunturu</surname> <given-names>S.</given-names></name>
<name><surname>Tiedje</surname> <given-names>J. M.</given-names></name>
<name><surname>Cole</surname> <given-names>J. R.</given-names></name>
<name><surname>Konstantinidis</surname> <given-names>K. T.</given-names></name>
</person-group> (<year>2018</year>). 
<article-title>Nonpareil 3: fast estimation of metagenomic coverage and sequence diversity</article-title>. <source>mSystems</source> <volume>3</volume>, <fpage>e00039</fpage>&#x2013;<lpage>e00018</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1128/mSystems.00039-18</pub-id>, PMID: <pub-id pub-id-type="pmid">29657970</pub-id>
</mixed-citation>
</ref>
<ref id="B45">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Rong</surname> <given-names>C.</given-names></name>
<name><surname>Zhou</surname> <given-names>K.</given-names></name>
<name><surname>Li</surname> <given-names>S.</given-names></name>
<name><surname>Xiao</surname> <given-names>K.</given-names></name>
<name><surname>Xu</surname> <given-names>Y.</given-names></name>
<name><surname>Zhang</surname> <given-names>R.</given-names></name>
<etal/>
</person-group>. (<year>2022</year>). 
<article-title>Isolation and characterization of a novel cyanophage encoding multiple auxiliary metabolic genes</article-title>. <source>Viruses</source> <volume>14</volume>, <elocation-id>887</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/v14050887</pub-id>, PMID: <pub-id pub-id-type="pmid">35632629</pub-id>
</mixed-citation>
</ref>
<ref id="B46">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Rozum</surname> <given-names>J. C.</given-names></name>
<name><surname>Sineath</surname> <given-names>W.</given-names></name>
<name><surname>Bohutskyi</surname> <given-names>P.</given-names></name>
<name><surname>Quenneville</surname> <given-names>J.</given-names></name>
<name><surname>Kim</surname> <given-names>D. N.</given-names></name>
<name><surname>Johnson</surname> <given-names>C.</given-names></name>
<etal/>
</person-group>. (<year>2025</year>). 
<article-title>Synergy and antagonism in a genome-scale model of metabolic hijacking by bacteriophages</article-title>. <source>bioRxiv</source>. doi:&#xa0;<pub-id pub-id-type="doi">10.1101/2024.12.11.628001</pub-id>, PMID: <pub-id pub-id-type="pmid">41723302</pub-id>
</mixed-citation>
</ref>
<ref id="B47">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Ruber</surname> <given-names>J.</given-names></name>
<name><surname>Geist</surname> <given-names>J.</given-names></name>
<name><surname>Hartmann</surname> <given-names>M.</given-names></name>
<name><surname>Millard</surname> <given-names>A. D.</given-names></name>
<name><surname>Raeder</surname> <given-names>U.</given-names></name>
<name><surname>Zubkov</surname> <given-names>M. V.</given-names></name>
<etal/>
</person-group>. (<year>2018</year>). 
<article-title>Spatio-temporal distribution pattern of the picocyanobacterium <italic>Synechococcus</italic> in lakes of different trophic states: A comparison of flow cytometry and sequencing approaches</article-title>. <source>Hydrobiologia</source> <volume>811</volume>, <fpage>77</fpage>&#x2013;<lpage>92</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s10750-017-3368-z</pub-id>, PMID: <pub-id pub-id-type="pmid">41721156</pub-id>
</mixed-citation>
</ref>
<ref id="B48">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Sahu</surname> <given-names>A.</given-names></name>
<name><surname>Singh</surname> <given-names>M.</given-names></name>
<name><surname>Amin</surname> <given-names>A.</given-names></name>
<name><surname>Malik</surname> <given-names>M. M.</given-names></name>
<name><surname>Qadiri</surname> <given-names>S. S. N.</given-names></name>
<name><surname>Abubakr</surname> <given-names>A.</given-names></name>
<etal/>
</person-group>. (<year>2025</year>). 
<article-title>A systematic review on environmental DNA (eDNA) science: an eco-friendly survey method for conservation and restoration of fragile ecosystems</article-title>. <source>Ecol. Indic.</source> <volume>173</volume>, <elocation-id>113441</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.ecolind.2025.113441</pub-id>, PMID: <pub-id pub-id-type="pmid">41723091</pub-id>
</mixed-citation>
</ref>
<ref id="B49">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>S&#xe1;nchez-Gallego</surname> <given-names>J.</given-names></name>
<name><surname>Curtis</surname> <given-names>N. P.</given-names></name>
<name><surname>Paerl</surname> <given-names>H. W.</given-names></name>
<name><surname>Paerl</surname> <given-names>R. W.</given-names></name>
</person-group> (<year>2025</year>). 
<article-title>New perspectives on picocyanobacteria and understudied cyanobacterial diversity in the albemarle pamlico sound system, north carolina, USA</article-title>. <source>Front. Microbiol.</source> <volume>16</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fmicb.2025.1539050</pub-id>, PMID: <pub-id pub-id-type="pmid">40415923</pub-id>
</mixed-citation>
</ref>
<ref id="B50">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Scanlan</surname> <given-names>D. J.</given-names></name>
<name><surname>Ostrowski</surname> <given-names>M.</given-names></name>
<name><surname>Mazard</surname> <given-names>S.</given-names></name>
<name><surname>Dufresne</surname> <given-names>A.</given-names></name>
<name><surname>Garczarek</surname> <given-names>L.</given-names></name>
<name><surname>Hess</surname> <given-names>W. R.</given-names></name>
<etal/>
</person-group>. (<year>2009</year>). 
<article-title>Ecological genomics of marine picocyanobacteria</article-title>. <source>Microbiol. Mol. Biol. Rev: MMBR</source> <volume>73</volume>, <fpage>249</fpage>&#x2013;<lpage>299</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1128/MMBR.00035-08</pub-id>, PMID: <pub-id pub-id-type="pmid">19487728</pub-id>
</mixed-citation>
</ref>
<ref id="B51">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Seemann</surname> <given-names>T.</given-names></name>
</person-group> (<year>2014</year>). 
<article-title>Prokka: rapid prokaryotic genome annotation</article-title>. <source>Bioinformatics</source> <volume>30</volume>, <fpage>2068</fpage>&#x2013;<lpage>2069</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/btu153</pub-id>, PMID: <pub-id pub-id-type="pmid">24642063</pub-id>
</mixed-citation>
</ref>
<ref id="B52">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Sharifian Gh.</surname> <given-names>M.</given-names></name>
<name><surname>Norouzi</surname> <given-names>F.</given-names></name>
</person-group> (<year>2023</year>). 
<article-title>Guidelines for an optimized differential centrifugation of cells</article-title>. <source>Biochem. Biophys Rep.</source> <volume>36</volume>, <elocation-id>101585</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.bbrep.2023.101585</pub-id>, PMID: <pub-id pub-id-type="pmid">38076661</pub-id>
</mixed-citation>
</ref>
<ref id="B53">
<mixed-citation publication-type="book">
<person-group person-group-type="author">
<name><surname>Sobocinski</surname> <given-names>K.</given-names></name>
</person-group> (<year>2021</year>). <source>State of the salish sea</source>. (<publisher-loc>Bellingham, Washington. United States</publisher-loc>: 
<publisher-name>Salish Sea Institute at Western CEDAR, Western Washington University</publisher-name>). doi:&#xa0;<pub-id pub-id-type="doi">10.25710/vfhb-3a69</pub-id>
</mixed-citation>
</ref>
<ref id="B54">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Visintini</surname> <given-names>N.</given-names></name>
<name><surname>Martiny</surname> <given-names>A. C.</given-names></name>
<name><surname>Flombaum</surname> <given-names>P.</given-names></name>
</person-group> (<year>2021</year>). 
<article-title><italic>Prochlorococcus</italic>, <italic>Synechococcus</italic>, and picoeukaryotic phytoplankton abundances in the global ocean</article-title>. <source>Limnol Oceanogr Lett.</source> <volume>6</volume>, <fpage>207</fpage>&#x2013;<lpage>215</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/lol2.10188</pub-id>, PMID: <pub-id pub-id-type="pmid">41718500</pub-id>
</mixed-citation>
</ref>
<ref id="B55">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Wagner</surname> <given-names>A. D.</given-names></name>
<name><surname>Ahmed</surname> <given-names>M. M.A.</given-names></name>
<name><surname>Starks</surname> <given-names>V.</given-names></name>
<name><surname>Boudreau</surname> <given-names>P. D.</given-names></name>
</person-group> (<year>2024</year>). 
<article-title>Using repeated lysis steps fractionates between heterotrophic and cyanobacterial DNA extracted from xenic cyanobacterial cultures</article-title>. <source>bioRxiv</source>. doi:&#xa0;<pub-id pub-id-type="doi">10.1101/2024.08.22.609136</pub-id>, PMID: <pub-id pub-id-type="pmid">39229059</pub-id>
</mixed-citation>
</ref>
<ref id="B56">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Walker</surname> <given-names>S.</given-names></name>
<name><surname>Mozaria-Luna</surname> <given-names>H. N.</given-names></name>
<name><surname>Kaplan</surname> <given-names>I.</given-names></name>
<name><surname>Petat&#xe1;n-Ram&#xed;rez</surname> <given-names>D.</given-names></name>
</person-group> (<year>2022</year>). 
<article-title>Future temperature and salinity in puget sound, washington state, under CMIP6 climate change scenarios</article-title>. <source>J. Water Climate Change</source> <volume>13</volume>, <fpage>4255</fpage>&#x2013;<lpage>4272</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.2166/wcc.2022.282</pub-id>, PMID: <pub-id pub-id-type="pmid">41533551</pub-id>
</mixed-citation>
</ref>
<ref id="B57">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Wilkinson</surname> <given-names>M. D.</given-names></name>
<name><surname>Dumontier</surname> <given-names>M.</given-names></name>
<name><surname>Aalbersberg</surname> <given-names>I. J.</given-names></name>
<name><surname>Appleton</surname> <given-names>G.</given-names></name>
<name><surname>Axton</surname> <given-names>M.</given-names></name>
<name><surname>Baak</surname> <given-names>A.</given-names></name>
<etal/>
</person-group>. (<year>2016</year>). 
<article-title>The FAIR guiding principles for scientific data management and stewardship</article-title>. <source>Sci. Data</source> <volume>3</volume>, <fpage>160018</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/sdata.2016.18</pub-id>, PMID: <pub-id pub-id-type="pmid">26978244</pub-id>
</mixed-citation>
</ref>
<ref id="B58">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Wright</surname> <given-names>M. N.</given-names></name>
<name><surname>Ziegler</surname> <given-names>A.</given-names></name>
</person-group> (<year>2017</year>). 
<article-title>Ranger: A fast implementation of random forests for high dimensional data in C++ and R</article-title>. <source>J. Stat. Softw</source> <volume>77</volume>, <fpage>1</fpage>&#x2013;<lpage>17</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.18637/jss.v077.i01</pub-id>
</mixed-citation>
</ref>
<ref id="B59">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Zehr</surname> <given-names>J. P.</given-names></name>
</person-group> (<year>2010</year>). 
<article-title>Microbes in earth&#x2019;s aqueous environments</article-title>. <source>Front. Microbiol.</source> <volume>1</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fmicb.2010.00004</pub-id>, PMID: <pub-id pub-id-type="pmid">21772828</pub-id>
</mixed-citation>
</ref>
<ref id="B60">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Zhang</surname> <given-names>J.</given-names></name>
<name><surname>Li</surname> <given-names>F.</given-names></name>
<name><surname>Long</surname> <given-names>L.</given-names></name>
<name><surname>Huang</surname> <given-names>S.</given-names></name>
</person-group> (<year>2022</year>). 
<article-title>Quantification of marine picocyanobacteria on water column particles and in sediments using real-time PCR reveals their role in carbon export</article-title>. <source>mSphere</source> <volume>7</volume>, <fpage>e00499</fpage>&#x2013;<lpage>e00422</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1128/msphere.00499-22</pub-id>, PMID: <pub-id pub-id-type="pmid">36472446</pub-id>
</mixed-citation>
</ref>
<ref id="B61">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Zinser</surname> <given-names>E. R.</given-names></name>
<name><surname>Coe</surname> <given-names>A.</given-names></name>
<name><surname>Johnson</surname> <given-names>Z. I.</given-names></name>
<name><surname>Martiny</surname> <given-names>A. C.</given-names></name>
<name><surname>Fuller</surname> <given-names>N. J.</given-names></name>
<name><surname>Scanlan</surname> <given-names>D. J.</given-names></name>
<etal/>
</person-group>. (<year>2006</year>). 
<article-title><italic>Prochlorococcus</italic> ecotype abundances in the north atlantic ocean as revealed by an improved quantitative PCR method</article-title>. <source>Appl. Environ. Microbiol.</source> <volume>72</volume>, <fpage>723</fpage>&#x2013;<lpage>732</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1128/AEM.72.1.723-732.2006</pub-id>, PMID: <pub-id pub-id-type="pmid">16391112</pub-id>
</mixed-citation>
</ref>
<ref id="B62">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Zufia</surname> <given-names>J. A.</given-names></name>
<name><surname>Legrand</surname> <given-names>C.</given-names></name>
<name><surname>Farnelid</surname> <given-names>H.</given-names></name>
</person-group> (<year>2022</year>). 
<article-title>Seasonal dynamics in picocyanobacterial abundance and clade composition at coastal and offshore stations in the baltic sea</article-title>. <source>Sci. Rep.</source> <volume>12</volume>, <fpage>14330</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41598-022-18454-8.References</pub-id>, PMID: <pub-id pub-id-type="pmid">41714676</pub-id>
</mixed-citation>
</ref>
</ref-list>
<fn-group>
<fn id="n1" fn-type="custom" custom-type="edited-by">
<p>Edited by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/319441">Jasna Vijayan</ext-link>, Cochin University of Science and Technology, India</p></fn>
<fn id="n2" fn-type="custom" custom-type="reviewed-by">
<p>Reviewed by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3325712">Xuhui Huang</ext-link>, Fudan University, China</p>
<p><ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3326217">Joel Sanchez</ext-link>, Estaci&#xf3;n Cient&#xed;fica Coiba (Coiba AIP), Panama</p></fn>
</fn-group>
</back>
</article>