<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Mar. Sci.</journal-id>
<journal-title>Frontiers in Marine Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Mar. Sci.</abbrev-journal-title>
<issn pub-type="epub">2296-7745</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fmars.2025.1621280</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Marine Science</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Statistical models for the estimation of pH and aragonite saturation state in the Northwestern Gulf of Mexico</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Jundt</surname>
<given-names>EvaLynn</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2950551/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Hu</surname>
<given-names>Xinping</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/433604/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Harte Research Institute, Texas A&amp;M University-Corpus Christi</institution>, <addr-line>Corpus Christi, TX</addr-line>,&#xa0;<country>United States</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Marine Science Institute, The University of Texas at Austin</institution>, <addr-line>Port Aransas, TX</addr-line>,&#xa0;<country>United States</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>Edited by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/203340/overview">Joan-Albert Sanchez-Cabeza</ext-link>, National Autonomous University of Mexico, Mexico</p>
</fn>
<fn fn-type="edited-by">
<p>Reviewed by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2904602/overview">Xinyu Li</ext-link>, University of Washington, United States</p>
<p>David Mori&#xf1;a, Autonomous University of Barcelona, Spain</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3058000/overview">Zhentao Sun</ext-link>, University of Delaware, United States</p>
</fn>
<fn fn-type="corresp" id="fn001">
<p>*Correspondence: EvaLynn Jundt, <email xlink:href="mailto:evalynnjundt@gmail.com">evalynnjundt@gmail.com</email>; Xinping Hu, <email xlink:href="mailto:xinping.hu@austin.utexas.edu">xinping.hu@austin.utexas.edu</email>
</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>03</day>
<month>09</month>
<year>2025</year>
</pub-date>
<pub-date pub-type="collection">
<year>2025</year>
</pub-date>
<volume>12</volume>
<elocation-id>1621280</elocation-id>
<history>
<date date-type="received">
<day>30</day>
<month>04</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>29</day>
<month>07</month>
<year>2025</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2025 Jundt and Hu.</copyright-statement>
<copyright-year>2025</copyright-year>
<copyright-holder>Jundt and Hu</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>Historical water column carbonate measurements have been scarce in the Gulf of Mexico (GOM); thus, the progression of ocean acidification (OA) is still poorly understood, especially in the subsurface waters. In the literature, statistical models, such as multiple linear regression (MLR), have been created to fill OA data gaps in different ocean regions. Additionally, machine learning techniques such as random forest (RF) have been used in model creations for both the open ocean and marginal seas. However, there is no statistical model for subsurface carbonate chemistry parameters (i.e., pH and &#x3a9;<sub>Arag</sub>) in the GOM. By creating models with various architectures built upon the relationships between commonly measured hydrographic properties (e.g., salinity, temperature, pressure, and dissolved oxygen or DO) and carbonate chemistry parameters (e.g., pH and aragonite saturation state, or &#x3a9;<sub>Arag</sub>), data gaps can be potentially filled in areas with insufficient sampling coverage. In this study, two statistical models were created for pH and &#x3a9;<sub>Arag</sub> in the northwestern GOM (nwGOM) within the range of 27.1&#x2013;29.0&#x2da;N and 89&#x2013;95.1&#x2da;W using both MLR and RF methods. The calibration data used in the models include salinity, temperature, pressure, and DO collected from seven cruises that took place between July 2007 and February 2023. The models predict &#x3a9;<sub>Arag</sub> with <italic>R</italic>
<sup>2</sup> &#x2265; 0.94, mean square error (MSE) &#x2264; 0.04, and pH with <italic>R</italic>
<sup>2</sup> &#x2265; 0.93, MSE &#x2264; 0.0005. Both the MLR and RF models perform similarly. These models are valuable tools for reconstructing pH and &#x3a9;<sub>Arag</sub> data where direct chemical observations are absent but hydrographic information is available in the nwGOM. Nevertheless, potential shifts in circulation, water mass changes, and accumulation of anthropogenic CO<sub>2</sub> need to be accounted for to improve and revise these models in the future.</p>
</abstract>
<kwd-group>
<kwd>ocean acidification</kwd>
<kwd>Gulf of Mexico</kwd>
<kwd>statistical models</kwd>
<kwd>carbonate chemistry</kwd>
<kwd>predictive models</kwd>
</kwd-group>
<counts>
<fig-count count="4"/>
<table-count count="2"/>
<equation-count count="5"/>
<ref-count count="77"/>
<page-count count="13"/>
<word-count count="8182"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-in-acceptance</meta-name>
<meta-value>Marine Biogeochemistry</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<title>Introduction</title>
<p>The capability of oceans to store absorbed CO<sub>2</sub> from the atmosphere is attributed to seawater&#x2019;s buffering capability. Through a chain of processes, from CO<sub>2</sub> dissolution to carbonic acid dissociation, only a small amount of absorbed CO<sub>2</sub> remains undissociated (i.e., aqueous CO<sub>2</sub>, or CO<sub>2</sub>
<sup>*</sup>) (<xref ref-type="bibr" rid="B76">Zeebe et&#xa0;al., 2011</xref>). Due to this reaction, CO<sub>2</sub> invasion into seawater results in changes to the speciation of the carbonate system. Thus, while the increase in CO<sub>2</sub>
<sup>*</sup> is proportional to the CO<sub>2</sub> increase in the atmosphere, the extent of the total dissolved inorganic carbon (DIC) concentration increase is lower than that in the atmosphere. As a result, carbonate ion (CO<sub>3</sub>
<sup>2&#x2212;</sup>) concentration decreases along with the release of H<sup>+</sup>, and carbonate saturation state (&#x3a9;) decreases following <xref ref-type="disp-formula" rid="eq1">Equation 1</xref>.</p>
<disp-formula id="eq1">
<label>(1)</label>
<mml:math display="block" id="M1">
<mml:mrow>
<mml:msub>
<mml:mi>&#x3a9;</mml:mi>
<mml:mrow>
<mml:mi>s</mml:mi>
<mml:mi>p</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#xa0;</mml:mo>
<mml:mo>=</mml:mo>
<mml:mo stretchy="false">[</mml:mo>
<mml:mi>C</mml:mi>
<mml:msup>
<mml:mi>a</mml:mi>
<mml:mrow>
<mml:mn>2</mml:mn>
<mml:mo>+</mml:mo>
</mml:mrow>
</mml:msup>
<mml:mo stretchy="false">]</mml:mo>
<mml:mo stretchy="false">[</mml:mo>
<mml:mi>C</mml:mi>
<mml:msubsup>
<mml:mi>O</mml:mi>
<mml:mn>3</mml:mn>
<mml:mrow>
<mml:mn>2</mml:mn>
<mml:mo>&#x2212;</mml:mo>
</mml:mrow>
</mml:msubsup>
<mml:mo stretchy="false">]</mml:mo>
<mml:mo stretchy="false">/</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:msub>
<mml:mi>K</mml:mi>
<mml:mrow>
<mml:mi>s</mml:mi>
<mml:msup>
<mml:mi>p</mml:mi>
<mml:mo>&#x2032;</mml:mo>
</mml:msup>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</disp-formula>
<p>Here, [Ca<sup>2+</sup>] is the concentration of calcium ions, and K<sub>sp&#x2019;</sub> is the stoichiometric solubility product (<xref ref-type="bibr" rid="B77">Zeebe and Wolf-Gladrow, 2001</xref>). K<sub>sp</sub>
<sup>&#x2019;</sup> is a function of the mineral phase (calcite or aragonite), pressure, salinity, and temperature. Based on thermodynamics, calcification is favored when &#x3a9; &gt; 1 (supersaturation), while dissolution is favored when &#x3a9; &lt; 1 (undersaturation). Ocean acidification (OA) can lead to unfavorable conditions for calcareous organisms such as corals, shellfish, calcareous algae, and other important calcifying species on the ocean food web (such as pteropods) by affecting their calcification (<xref ref-type="bibr" rid="B7">Bednar&#x161;ek et&#xa0;al., 2012</xref>; <xref ref-type="bibr" rid="B29">Erez et&#xa0;al., 2011</xref>; <xref ref-type="bibr" rid="B31">Eyre et&#xa0;al., 2014</xref>; <xref ref-type="bibr" rid="B37">Hoegh-Guldberg et&#xa0;al., 2007</xref>).</p>
<p>Although there has been increasing effort in collecting carbonate chemistry data, creating novel applications of models to supplement existing datasets in many areas, especially the coastal ocean, including the GOM, is still needed. Currently, the data coverage in the nwGOM is limited to infrequent water chemistry data collections from several NOAA-led cruises (<xref ref-type="bibr" rid="B6">Barbero et&#xa0;al., 2024</xref>, <xref ref-type="bibr" rid="B5">2017</xref>; <xref ref-type="bibr" rid="B60">Peng and Langdon, 2007</xref>; <xref ref-type="bibr" rid="B74">Wanninkhof et&#xa0;al., 2012</xref>) and those from our study. New methods are being put into practice to remedy the missing data, including autonomous measurements, although many of these platforms are limited with measuring pH and CO<sub>2</sub> partial pressure (<italic>p</italic>CO<sub>2</sub>), hence, available datasets often lack the necessary information for characterizing OA conditions in the coastal region.</p>
<p>In recent years, statistical modeling based on hydrographic data has been used to fill in data gaps in water column carbonate chemistry datasets (<xref ref-type="bibr" rid="B43">Juranek et&#xa0;al., 2009</xref>), as such data (including salinity, temperature, dissolved oxygen or DO, and sometimes nutrients) are much more widely available. By creating models using commonly measured hydrographic data, information such as &#x3a9;<sub>Arag</sub> (i.e., aragonite saturation state), pH, total dissolved inorganic carbon (DIC), and total alkalinity (TA) can be calculated (e.g., <xref ref-type="bibr" rid="B15">Carter et&#xa0;al., 2018</xref>). An early example of these studies was done for &#x3a9;<sub>Arag</sub> on the continental shelf of central Oregon (<xref ref-type="bibr" rid="B43">Juranek et&#xa0;al., 2009</xref>), where a multilinear regression (MLR) model using temperature and oxygen was developed for &#x3a9;<sub>Arag</sub> (coefficient of determination or <italic>R</italic>
<sup>2</sup> = 0.987, with mean standard error or MSE of 0.003). This MLR model was used for constructing comprehensive water-column &#x3a9;<sub>Arag</sub> values to evaluate the seasonal evolution of &#x3a9;<sub>Arag</sub>. The application of MLR models with adjustments for anthropogenic CO<sub>2</sub> to determine &#x3a9;<sub>Arag</sub> using historical datasets was done in a study in the Sea of Japan (East Sea), where a similar model was applied to a historical dataset lacking &#x3a9;<sub>Arag</sub>, resulting in an &#x3a9;<sub>Arag</sub> dataset from 1960 to 2000 (<xref ref-type="bibr" rid="B44">Kim et&#xa0;al., 2010</xref>). Similar models have also been proven effective for the prediction of &#x3a9;<sub>Arag</sub> in other locations, with some model applications including TA and DIC (<xref ref-type="bibr" rid="B1">Alin et&#xa0;al., 2012</xref>; <xref ref-type="bibr" rid="B8">Bostock et&#xa0;al., 2013</xref>; <xref ref-type="bibr" rid="B36">Hare et&#xa0;al., 2025</xref>; <xref ref-type="bibr" rid="B50">McGarry et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B14">Carter at al., 2021</xref>).</p>
<p>Our study developed statistical models using both and random forest (RF) architectures for the purpose of predicting pH and &#x3a9;<sub>Arag</sub> in the northwestern Gulf of Mexico (nwGOM). <xref ref-type="disp-formula" rid="eq2">Equation 2</xref> was used to represent the MLR model, where Y is the target variable, &#x3b2;<sub>0</sub> is the y-intercept, &#x3b2;<sub>x</sub> represents the slope intercept, X<sub>x</sub> is the predictor variables and &#x3f5; is the error term. MLR is a popular and effective linear modeling technique that has been applied in a vast number of research areas, including the aforementioned successful applications to marine carbonate chemistry, and thus was a clear choice.</p>
<disp-formula id="eq2">
<label>(2)</label>
<mml:math display="block" id="M2">
<mml:mrow>
<mml:mi>Y</mml:mi>
<mml:mo>=</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:msub>
<mml:mi>&#x3b2;</mml:mi>
<mml:mn>0</mml:mn>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:msub>
<mml:mi>&#x3b2;</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:msub>
<mml:mi>X</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>&#xa0;</mml:mo>
<mml:mo>+</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:msub>
<mml:mi>&#x3b2;</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
<mml:msub>
<mml:mi>X</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
<mml:mo>&#xa0;</mml:mo>
<mml:mo>+</mml:mo>
<mml:mo>&#x2026;</mml:mo>
<mml:mo>+</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:mi>&#x3f5;</mml:mi>
</mml:mrow>
</mml:math>
</disp-formula>
<p>Machine learning has emerged as an alternative to linear models in numerous fields (<xref ref-type="bibr" rid="B68">Thessen, 2016</xref>). The proliferation of machine learning techniques has led to the development of methods for a wide variety of datasets and goals. The simplest machine learning models, such as decision trees and RF models, which are constructed from a group of decision trees, each trained on a distinct subset of data. These three based models are frequently preferred when applicable due to their explanatory capability through feature importance, low computing power requirements, and ability to operate on relatively small datasets (<xref ref-type="bibr" rid="B22">Cutler et&#xa0;al., 2007</xref>). RF is a versatile and powerful ensemble learning method capable of producing high-quality predictions while effectively handling noisy data and mitigating common challenges such as overfitting (<xref ref-type="bibr" rid="B9">Breiman, 2001</xref>). By aggregating the predictions of multiple decision trees, each trained on distinct subsets of data, the randomness introduced by this approach enhances prediction accuracy and diminishes the risk of overfitting (<xref ref-type="bibr" rid="B68">Thessen, 2016</xref>). Moreover, RF offers interpretability that many other machine learning models lack, through assessment of feature importance, which measures how much each feature contributes to reducing impurity (like variance) across all the trees in the forest, indicating its overall influence on the model&#x2019;s predictions. This combination of robustness, accuracy, and interpretability makes RF well suited for both classification and regression tasks (<xref ref-type="bibr" rid="B68">Thessen, 2016</xref>). For this study, statistical and machine learning methods were used to create MLR and RF models using measured hydrographic data (salinity, temperature, pressure, DO) to estimate pH and &#x3a9;<sub>Arag</sub>. These models will have the capacity not only to estimate pH and &#x3a9;<sub>Arag</sub> using existing datasets but also could pair with current and potentially future autonomous observation platforms to create near real-time estimated pH and &#x3a9;<sub>Arag</sub> coverage within the recommended timeframe (i.e., the next 10 years). This study will also serve as a valuable baseline of data for future OA research in the nwGOM.</p>
</sec>
<sec id="s2">
<title>Methods</title>
<sec id="s2_1">
<title>Dataset description</title>
<p>Water column studies focusing on the carbonate system in the GOM shelf and upper slope (up to 1000 m) region include GOMECC cruises 1&#x2013;4 in 2007, 2012, 2017, and 2021 (<xref ref-type="bibr" rid="B6">Barbero et&#xa0;al., 2024</xref>, <xref ref-type="bibr" rid="B5">2017</xref>; <xref ref-type="bibr" rid="B60">Peng and Langdon, 2007</xref>; <xref ref-type="bibr" rid="B74">Wanninkhof et&#xa0;al., 2012</xref>) (<xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>). In addition to these large-scale expeditions, regional datasets also exist from individual studies focusing largely on the northern GOM shelf (<xref ref-type="bibr" rid="B13">Cai et&#xa0;al., 2020</xref>, <xref ref-type="bibr" rid="B12">2011</xref>; <xref ref-type="bibr" rid="B38">Hu et&#xa0;al., 2017</xref>; <xref ref-type="bibr" rid="B40">Huang et&#xa0;al., 2015</xref>).</p>
<table-wrap id="T1" position="float">
<label>Table&#xa0;1</label>
<caption>
<p>Summary of datasets included in this research study.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" colspan="2" align="center">Name</th>
<th valign="middle" align="center">Date</th>
<th valign="middle" align="center"># Observations</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" rowspan="3" align="center">GOMECC</td>
<td valign="middle" align="center">1</td>
<td valign="middle" align="center">July 2007</td>
<td valign="middle" align="center">90</td>
</tr>
<tr>
<td valign="middle" align="center">3</td>
<td valign="middle" align="center">July 2017</td>
<td valign="middle" align="center">131</td>
</tr>
<tr>
<td valign="middle" align="center">4</td>
<td valign="middle" align="center">October 2021</td>
<td valign="middle" align="center">59</td>
</tr>
<tr>
<td valign="middle" rowspan="4" align="center">XR</td>
<td valign="middle" align="center">1</td>
<td valign="middle" align="center">April 2021</td>
<td valign="middle" align="center">104</td>
</tr>
<tr>
<td valign="middle" align="center">2</td>
<td valign="middle" align="center">August 2021</td>
<td valign="middle" align="center">107</td>
</tr>
<tr>
<td valign="middle" align="center">3</td>
<td valign="middle" align="center">December 2022</td>
<td valign="middle" align="center">57</td>
</tr>
<tr>
<td valign="middle" align="center">4</td>
<td valign="middle" align="center">February 2023</td>
<td valign="middle" align="center">121</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p>Number of observations column indicates the total number of observations from each cruise included in modeling after modification for target depth and calculation of necessary parameters.</p>
</table-wrap-foot>
</table-wrap>
<p>From April 2021 to February 2023, five cruises were conducted in the nwGOM shelf and upper slope to collect both surface and water column data across different seasons as a part of the project &#x201c;Ocean Acidification at a Crossroad&#x201d; (XR) (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1</bold>
</xref>). Among the stations sampled were those along the Galveston transect, which is a transect along the 95&#xb0; W longitude first taken during GOMECC-1 cruise. This transect was sampled on GOMECCs 3 and 4 and again by the XR project in April and August of 2021, December of 2022, and February of 2023 (<xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>; <xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1</bold>
</xref>). The combined dataset before circulations QC and preparation included 960 data points from 36 stations, out of which 94 of these data points from the GOMECC-4 cruise were to be used for testing the models while the remaining 866 data points were to be split (90:10) and used for model training and calibration.</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>A map of the study area and stations where data was collected.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-12-1621280-g001.tif">
<alt-text content-type="machine-generated">Map of the Gulf Coast showing various stations. Locations are marked by colored circles: red for GOMECC 3, green for GOMECC 1, teal for GOMECC 4, and purple for XR. The circles are distributed along the coast from 96&#xb0;W to 90&#xb0;W.</alt-text>
</graphic>
</fig>
</sec>
<sec id="s2_2">
<title>Sampling and analytical methods</title>
<p>Seawater sampling for the XR cruises was done following the best practices for carbonate chemistry analysis (<xref ref-type="bibr" rid="B25">Dickson et&#xa0;al., 2007</xref>). Briefly, samples were taken from the Niskin bottles into 250-ml ground-neck borosilicate glass bottles. Preservation of samples for carbonate chemistry analyses was done by adding 100 &#x3bc;l of saturated HgCl<sub>2</sub> solution. Glass stoppers with the aid of Apiezon<sup>&#xae;</sup> L grease and rubber bands were used to seal the samples. The GOMECC samples were analyzed on board the ship, including DO, DIC, and TA; nutrient samples were analyzed at the Atlantic Oceanographic and Meteorological Laboratory (AOML) (<xref ref-type="bibr" rid="B5">Barbero et&#xa0;al., 2017</xref>, <xref ref-type="bibr" rid="B6">2024</xref>; <xref ref-type="bibr" rid="B60">Peng and Langdon, 2007</xref>; <xref ref-type="bibr" rid="B74">Wanninkhof et&#xa0;al., 2012</xref>). All XR carbonate chemistry (DIC, pH, and TA) samples were analyzed in our lab at Texas A&amp;M University-Corpus Christi (<xref ref-type="bibr" rid="B39">Hu et&#xa0;al., 2018</xref>), and DO was analyzed on board the ship. Nutrient samples were analyzed at the Geochemical and Environmental Research Group at Texas A&amp;M University.</p>
<p>For the GOMECC samples, DO was determined using an automated oxygen titrator with amperometric end-point detection (<xref ref-type="bibr" rid="B21">Culberson and Huang, 1987</xref>). DIC was determined using gas calibrations and Certified Reference Material (CRM) stability checks to ensure proper performance (with precisions of &#xb1; 1.37 &#xb5;mol/kg) (<xref ref-type="bibr" rid="B41">Johnson et&#xa0;al., 1985</xref>). For the XR samples, DO was determined on a selected subset of the samples using Winkler titration (<xref ref-type="bibr" rid="B20">Culberson, 1991</xref>; <xref ref-type="bibr" rid="B75">Winkler, 1888</xref>), as these water samples were used to verify the DO sensor on the onboard the CTD (<xref ref-type="bibr" rid="B26">DiMarco et&#xa0;al., 2012</xref>). DIC was determined using infrared methodology on a DIC analyzer (Apollo SciTech Inc.) with CRM to ensure optimal instrument performance (with precisions of &#xb1;0.1%) (<xref ref-type="bibr" rid="B17">Chen et&#xa0;al., 2015</xref>). For all cruises, TA was analyzed using open-cell Gran titration (<xref ref-type="bibr" rid="B34">Gran, 1952</xref>), and pH was analyzed using a spectrophotometric method with purified m-cresol purple (<xref ref-type="bibr" rid="B48">Liu et&#xa0;al., 2011</xref>). Due to the COVID-19-caused interruption to CRM supply in early 2021, XR1 samples were analyzed using CRM Batch #181 and a homemade secondary reference (based on CRM Batch #181) taken from filtered (0.2 &#xb5;m) and HgCl<sub>2</sub>-dosed Aransas Ship Channel water. XR2 samples used CRM Batch #194, 197, and 198; XR3 samples used CRM Batch #202 and 204; and XR4 samples used Batch #204 only, while XR5 samples used Batch #204 and 205.</p>
</sec>
<sec id="s2_3">
<title>Calculations, QC, and data preparation</title>
<p>Speciation calculations for the GOMECC-1 data used TA, DIC, and nutrients as input variables as direct pH measurement using the spectrophotometric method was not available. Estimated uncertainties using the average surface water conditions for pH and &#x2126;<sub>Arag</sub> were &#xb1;0.01 and &#xb1;0.17, respectively (<xref ref-type="bibr" rid="B56">Orr et&#xa0;al., 2018</xref>); then DIC and pH were used for speciation calculations in all other GOMECC datasets as well as the XR ones without nutrient data, resulting in an uncertainty in &#x2126;<sub>Arag</sub> of &#xb1;0.18. Though some calculations were done without nutrients, uncertainty contributed to the combined standard uncertainty are negligible even in high-nutrient regions, except in high-nutrient waters with TA as a member of the input pair (<xref ref-type="bibr" rid="B56">Orr et&#xa0;al., 2018</xref>). Carbonate speciation calculation was done using the MatLab version program CO2SYS (<xref ref-type="bibr" rid="B65">Sharp et&#xa0;al., 2023</xref>; <xref ref-type="bibr" rid="B71">van Heuven et&#xa0;al., 2011</xref>). Carbonate dissociation constants from <xref ref-type="bibr" rid="B51">Mehrbach et&#xa0;al. (1973)</xref> refit by <xref ref-type="bibr" rid="B23">Dickson and Millero (1987)</xref>, the dissociation constant of bisulfate reported in <xref ref-type="bibr" rid="B24">Dickson et al. (1990)</xref>, the total boron concentration provided in <xref ref-type="bibr" rid="B70">Uppstr&#xf6;m (1974)</xref>, and the aragonite solubility constant from <xref ref-type="bibr" rid="B55">Mucci (1983)</xref> were used in these calculations. As nutrient data were not available for the XR cruises due to technical issues encountered during the pandemic, we were not able to do a strict internal consistency analysis because using TA as one of the input variables would require nutrient information. However, the offset between calculated (using DIC/pH without nutrients, except for GOMECC-1) and measured TA values, was compared across all cruises to ensure that data quality was consistent among these trips (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2</bold>
</xref>) (<xref ref-type="bibr" rid="B58">Patsavas et&#xa0;al., 2015</xref>).</p>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>Visuals for quality control comparisons of analysis between XR and GOMECC datasets. Boxplot <bold>(a)</bold> showing distribution of &#x394;TA by calculation inputs separated by depth. Scatterplot <bold>(b)</bold> visualizing the spread of &#x394;TA by calculation inputs by measured TA values.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-12-1621280-g002.tif">
<alt-text content-type="machine-generated">Panel a shows box plots of residuals of total alkalinity in micromoles per kilogram across various depths for GOMECC and XR, indicating similar distributions. Panel b is a scatter plot comparing measured values to residuals, with GOMECC and XR data points closely clustered around the zero line.</alt-text>
</graphic>
</fig>
<p>When modeling carbonate chemistry, it is crucial to focus on a geographic area where local processes and water masses exert similar control. This ensures that the relationships between parameters remain consistent throughout the area and are accurately captured in the models. Hence, data used for our model development were limited spatially within the range of 27.1&#x2013;29.0&#x2da;N and 89&#x2013;95.1&#x2da;W. Removal of the upper water column of various depths is regularly done in some capacity in carbonate modeling studies in an attempt to remove large, short-term, unconstrained variabilities, such as surface water gas exchange, physical, biological, and seasonal changes (<xref ref-type="bibr" rid="B43">Juranek et&#xa0;al., 2009</xref>; <xref ref-type="bibr" rid="B44">Kim et&#xa0;al., 2010</xref>; <xref ref-type="bibr" rid="B47">Lima et&#xa0;al., 2023</xref>; <xref ref-type="bibr" rid="B50">McGarry et&#xa0;al., 2021</xref>). Depth ranges of the mixed layer to be removed vary by location and season. Some models do not require exclusion of air-surface water interactions due to predictor variables being unaffected by this exchange, and others have used removal of additional surface water as a means of removing the effect of seasonality (<xref ref-type="bibr" rid="B43">Juranek et&#xa0;al., 2009</xref>; <xref ref-type="bibr" rid="B44">Kim et&#xa0;al., 2010</xref>; <xref ref-type="bibr" rid="B47">Lima et&#xa0;al., 2023</xref>; <xref ref-type="bibr" rid="B50">McGarry et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B52">Montes et&#xa0;al., 2016</xref>). Since the models produced in this study could contain DO, removing air-sea interaction was necessary. However, the removal of the mixed layer to eliminate seasonality as done by <xref ref-type="bibr" rid="B44">Kim et&#xa0;al. (2010)</xref> would equate to a removal of more than 100 m to account for the seasonal changes in mixed layer depth, as winter mixed layer depth in nwGOM can be more than 100 m (<xref ref-type="bibr" rid="B54">Muller-Karger et&#xa0;al., 2015</xref>). To retain as much data as possible while removing seasonality, removal of the upper 30 m of data was arbitrarily chosen. Note this removal should more than cover the depth of the mixed layer in summer but is shallower than those depths in winter and spring. The predictor parameters (salinity, temperature, pressure, and DO) were normalized to avoid collinearity, which causes computational problems that make parameter estimates unstable (<xref ref-type="bibr" rid="B62">Quinn and Keough, 2002</xref>). This was done through computing <italic>Z</italic>-scores using <xref ref-type="disp-formula" rid="eq3">Equation 3</xref>, where X<sub>i</sub> is the predictor variable data point, X<sub>m</sub> is the mean of the calibration set, and X<sub>SD</sub> is the standard deviation of the calibration set. This can be described as centering by subtracting the mean and dividing by the standard deviation, resulting in predictor variables having a mean of 0 and a standard deviation of 1.</p>
<disp-formula id="eq3">
<label>(3)</label>
<mml:math display="block" id="M3">
<mml:mrow>
<mml:msub>
<mml:mi>X</mml:mi>
<mml:mi>n</mml:mi>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:msub>
<mml:mi>X</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>X</mml:mi>
<mml:mi>m</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mi>X</mml:mi>
<mml:mrow>
<mml:mi>S</mml:mi>
<mml:mi>D</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<p>This approach uses normalized predictor variables to estimate nonnormalized target variables, so the relative importance of multiple parameters can be compared within one model through the magnitude of the coefficients. The normalized predictor variables were tested for collinearity by calculating the variance inflation factor (VIF) for each predictor. Combinations of terms resulting in a VIF greater than 10, indicating excessive collinearity, were not used in any model (<xref ref-type="bibr" rid="B45">Kutner et&#xa0;al., 2005</xref>). Outliers were identified using studentized residuals, which are more effective for detecting outlying Y observations than standardized residuals. Studentized residuals larger than 3 (which are classified as outliers) were further examined. Each data point was individually evaluated, considering corresponding measurements from the same sample for consistency. Data flagged as questionable across multiple parameters were carefully considered, and if multiple indicators suggested potential error, the observation was excluded from the dataset. Any data points with studentized residuals &gt;5 were removed due to the likelihood of being erroneous or anomalous.</p>
</sec>
<sec id="s2_4">
<title>Model creation</title>
<p>The modeling exercise was conducted in Python using the <italic>Scikit-learn</italic> packages (<xref ref-type="bibr" rid="B59">Pederegosa et al., 2011</xref>). Using a combination of the measured data (salinity or S; temperature or T; DO; and pressure, or P), these techniques produced RF and MLR models for pH and &#x3a9;<sub>Arag</sub>. The predictor variables were selected by dredge for MLR models or variable importance for RF models (see below for details). The process was repeated until either <italic>R</italic>
<sup>2</sup> values were &lt;0.90 or only one predictor variable remained. Final predictor variable selections were used to create final models that were evaluated.</p>
<p>MLR - Empirical models were developed for each target variable (i.e., pH and &#x3a9;<sub>Arag</sub>) using least squares multiple linear regression on each combination of hydrographic variables, following the methods of <xref ref-type="bibr" rid="B43">Juranek et&#xa0;al. (2009)</xref> and <xref ref-type="bibr" rid="B1">Alin et&#xa0;al. (2012)</xref>. All parameters (DO, S, T, P) in the training data were given as predictors to a full MLR model. Dredge methodology was used to evaluate every possible combination of the four parameters. From among the combinations, all models were ranked based on minimizing the Akaike information criterion (AIC), a metric for model selection that incorporates both the goodness of fit and a penalty for complexity (<xref ref-type="bibr" rid="B10">Burnham and Anderson, 2004</xref>). The best performing models with <italic>R</italic>
<sup>2</sup> &gt; 0.90 and correlation coefficients with correct signs (&#xb1;) were selected for further evaluation.</p>
<p>RF - An initial RF model was created including all four variables. Hyperparameter tuning is the process of optimizing a model&#x2019;s configuration settings to improve performance by specifying tuned values for the number of trees, max tree depth, and minimum samples split. Hyperparameters for tuning were decided using scickit-learn GridSearchCV (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S2</bold>
</xref>). Selected hyperparameters were applied using an RF regressor function (<xref ref-type="bibr" rid="B61">Probst et&#xa0;al., 2019</xref>). After this step, the variable importance was analyzed, and a stepwise procedure was followed to create a new model without the variable of least importance. The new model was then tuned and evaluated, if the model's R2 &gt; 0.90 it would be considered in the final model valuation. In addition, the process starting by analyzing feature importance to create a simpler model was continued until the resulting model did not meet previously stated criteria.</p>
</sec>
<sec id="s2_5">
<title>Model evaluation</title>
<p>The models were used to predict their target variable while using predictor variable data from the completely &#x201c;unseen data,&#x201d; or data uninvolved in the training process, in this instance, the GOMECC-4 data. By using data from a cruise, which also took place within the time period that the modeled data were collected, separate from the training data, this ensures that the model performance results will accurately represent the models&#x2019; efficacy on new data. To ensure that the test dataset is representative of the training dataset and that the distributions of the variables are not problematically different, a two-step evaluation process was conducted. First, the distribution of each variable in both the training and test datasets was visually examined using graphical representations, such as histograms, density plots, or boxplots, to identify any noticeable differences. Second, the Kolmogorov&#x2013;Smirnov (KS) test, a non-parametric statistical test, was applied to each variable to evaluate whether two samples are drawn from the same underlying distribution by comparing their cumulative distribution functions (<xref ref-type="bibr" rid="B49">Massey, 1951</xref>). These analyses collectively concluded that the training and test datasets are statistically comparable, minimizing the risk of bias in model evaluation due to distributional differences.</p>
<p>After confirmation of the representative quality of the test data, model evaluations were based on the performance across multiple metrics, including mean absolute error (MAE), mean square error (MSE), mean absolute percent error (MAPE), correlation coefficient R<sup>2</sup>, and spatial bias (<xref ref-type="bibr" rid="B72">Vujovic, 2021</xref>). MAE and MSE represent the absolute-difference and the squared-difference metrics, respectively. MLR model variable coefficients were used for interpretation of relative variable effect. The RF model variable importance best describes model fit, not direct variable relationships, and therefore was not interpreted this way, that is, variable effect. Additional analysis of the residual data to identify normality and potential signals was done using QQ-plots and Shapiro&#x2013;Wilks tests (<xref ref-type="bibr" rid="B18">Chen et&#xa0;al., 2019</xref>) (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figures S1</bold>
</xref>-<xref ref-type="supplementary-material" rid="SM1">
<bold>S8</bold>
</xref>).</p>
</sec>
</sec>
<sec id="s3" sec-type="results">
<title>Results</title>
<p>The models chosen to predict both &#x2126;<sub>Arag</sub> and pH included different combinations of the following parameters: salinity, temperature, pressure, and DO (<xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>). All linear combinations of hydrographic parameters in the models presented here resulted in VIFs less than 10, suggesting that there is no statistical evidence of coupling between any of the predictor variables. The MLR and RF models for &#x2126;<sub>Arag</sub> had adjusted <italic>R</italic>
<sup>2</sup> values between 0.94 and 0.99 and MAE values between 0.06 and 0.14. The MLR and RF models for pH had adjusted R<sup>2</sup> values between 0.93 and 0.96 and MAE values between 0.01 and 0.02. As shown in <xref ref-type="fig" rid="f3">
<bold>Figures&#xa0;3</bold>
</xref> and <xref ref-type="fig" rid="f4">
<bold>4</bold>
</xref>, the residuals for all model versions displayed some visually identifiable tendency for greater error in shallower depths. This, in combination with poorer performance of models including all depths, supports the choice made to mitigate uncertainty caused by air-sea interaction by the exclusion of the mixed layer in some capacity (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S2</bold>
</xref>). MAPE statistics indicate the models for pH displayed less deviation between predicted and actual values and may perform better when used with new data (<xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>). These model evaluative criteria indicate that both models produced reliable results across the range of observed values in the calibration dataset (<xref ref-type="fig" rid="f3">
<bold>Figures&#xa0;3</bold>
</xref>, <xref ref-type="fig" rid="f4">
<bold>4</bold>
</xref>).</p>
<table-wrap id="T2" position="float">
<label>Table&#xa0;2</label>
<caption>
<p>Summary of all models for the prediction of pH including their performance metrics and variable importance for RF models and coefficients for MLR models.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="center">
</th>
<th valign="middle" align="center">MSE</th>
<th valign="middle" align="center">MAE</th>
<th valign="middle" align="center">MAPE</th>
<th valign="middle" align="center">
<italic>R</italic>
<sup>2</sup>
</th>
<th valign="middle" align="center">MSE</th>
<th valign="middle" align="center">MAE</th>
<th valign="middle" align="center">
<italic>R</italic>
<sup>2</sup>
</th>
<th valign="middle" align="center">Temperature</th>
<th valign="middle" align="center">Dissolved Oxygen</th>
<th valign="middle" align="center">Pressure</th>
<th valign="middle" align="center">Salinity</th>
<th valign="middle" align="center">Intercept</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="center">&#x3a9;<sub>Arag</sub> RF 3</td>
<td valign="middle" align="center">0.010</td>
<td valign="middle" align="center">0.071</td>
<td valign="middle" align="center">0.029</td>
<td valign="middle" align="center">0.987</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">0.011</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">0.068</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">0.985</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">0.56</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">0.09</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">0.35</td>
<td valign="middle" align="center" style="background-color:#d9d9d9"/>
<td valign="middle" align="center" style="background-color:#d9d9d9"/>
</tr>
<tr>
<td valign="middle" align="center">&#x3a9;<sub>Arag</sub> RF 2</td>
<td valign="middle" align="center">0.021</td>
<td valign="middle" align="center">0.095</td>
<td valign="middle" align="center">0.039</td>
<td valign="middle" align="center">0.971</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">0.025</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">0.095</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">0.966</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">0.61</td>
<td valign="middle" align="center" style="background-color:#d9d9d9"/>
<td valign="middle" align="center" style="background-color:#d9d9d9">0.39</td>
<td valign="middle" align="center" style="background-color:#d9d9d9"/>
<td valign="middle" align="center" style="background-color:#d9d9d9"/>
</tr>
<tr>
<td valign="middle" align="center">&#x3a9;<sub>Arag</sub> RF 1</td>
<td valign="middle" align="center">0.037</td>
<td valign="middle" align="center">0.130</td>
<td valign="middle" align="center">0.051</td>
<td valign="middle" align="center">0.949</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">0.044</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">0.135</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">0.94</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">1</td>
<td valign="middle" align="center" style="background-color:#d9d9d9"/>
<td valign="middle" align="center" style="background-color:#d9d9d9"/>
<td valign="middle" align="center" style="background-color:#d9d9d9"/>
<td valign="middle" align="center" style="background-color:#d9d9d9"/>
</tr>
<tr>
<td valign="middle" align="center">&#x3a9;<sub>Arag</sub> MLR 4</td>
<td valign="middle" align="center">0.009</td>
<td valign="middle" align="center">0.072</td>
<td valign="middle" align="center">0.032</td>
<td valign="middle" align="center">0.987</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">0.01</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">0.056</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">0.986</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">0.3982</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">0.3722</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">-0.0544</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">0.0989</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">2.5369</td>
</tr>
<tr>
<td valign="middle" align="center">
<bold>&#x3a9;</bold>
<sub>Arag</sub> <bold>MLR 3</bold>
</td>
<td valign="middle" align="center">
<bold>0.010</bold>
</td>
<td valign="middle" align="center">
<bold>0.071</bold>
</td>
<td valign="middle" align="center">
<bold>0.032</bold>
</td>
<td valign="middle" align="center">
<bold>0.987</bold>
</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">
<bold>0.011</bold>
</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">
<bold>0.063</bold>
</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">
<bold>0.984</bold>
</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">
<bold>0.4367</bold>
</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">
<bold>0.3687</bold>
</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">
<bold>-0.1127</bold>
</td>
<td valign="middle" align="center" style="background-color:#d9d9d9"/>
<td valign="middle" align="center" style="background-color:#d9d9d9">
<bold>2.537</bold>
</td>
</tr>
<tr>
<td valign="middle" align="center">
<bold>pH RF 3</bold>
</td>
<td valign="middle" align="center">
<bold>0.0003</bold>
</td>
<td valign="middle" align="center">
<bold>0.013</bold>
</td>
<td valign="middle" align="center">
<bold>0.002</bold>
</td>
<td valign="middle" align="center">
<bold>0.959</bold>
</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">
<bold>0.0002</bold>
</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">
<bold>0.013</bold>
</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">
<bold>0.961</bold>
</td>
<td valign="middle" align="center" style="background-color:#d9d9d9"/>
<td valign="middle" align="center" style="background-color:#d9d9d9">
<bold>0.15</bold>
</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">
<bold>0.75</bold>
</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">
<bold>0.1</bold>
</td>
<td valign="middle" align="center" style="background-color:#d9d9d9"/>
</tr>
<tr>
<td valign="middle" align="center">pH MLR 3</td>
<td valign="middle" align="center">0.001</td>
<td valign="middle" align="center">0.018</td>
<td valign="middle" align="center">0.002</td>
<td valign="middle" align="center">0.929</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">0.0005</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">0.017</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">0.929</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">-0.0078</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">0.0647</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">-0.0432</td>
<td valign="middle" align="center" style="background-color:#d9d9d9"/>
<td valign="middle" align="center" style="background-color:#d9d9d9">7.9512</td>
</tr>
<tr>
<td valign="middle" align="center">pH MLR 4</td>
<td valign="middle" align="center">0.000</td>
<td valign="middle" align="center">0.016</td>
<td valign="middle" align="center">0.002</td>
<td valign="middle" align="center">0.946</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">0.0003</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">0.011</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">0.955</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">-0.0232</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">0.0661</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">-0.0198</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">0.0396</td>
<td valign="middle" align="center" style="background-color:#d9d9d9">7.9511</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>Unshaded area includes results from performance of validation dataset; shaded area indicates performance of unseen test data. Number in the model ID reflects the number of variables used in the model. MSE is mean square error, MAE is mean absolute error, MAPE is mean absolute percent error, <italic>R</italic>
<sup>2</sup> is the correlation coefficient. The rows with the bold fonts indicate the best models.Note the first column includes modeled parameter (&#x3a9;<sub>Arag</sub> and pH), and the numbers after the statistical models (RF or MLR) indicate the number of predicting variables used.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>pH models predicted values plotted by measured values from models&#x2019; application to test dataset (GOMECC4) <bold>(a)</bold>, residuals plotted by measured &#x2126;<sub>Arag</sub> <bold>(b)</bold>, and depth <bold>(c)</bold>. Points color coded for each model (<xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>).</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-12-1621280-g003.tif">
<alt-text content-type="machine-generated">Three scatter plots illustrate pH models. Plot a: predicted versus measured pH, showing a strong linear correlation. Plot b: residuals versus measured pH, displaying a spread centered near zero. Plot c: residuals versus depth, with points scattered around the zero line, indicating consistent model performance across depths. RF 4, MLR 3, and MLR 4 models are represented by different colors: green, orange, and blue.</alt-text>
</graphic>
</fig>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>&#x2126;<sub>Arag</sub> models predicted values plotted by measured values from models&#x2019; application to test dataset (GOMECC4) <bold>(a)</bold>, residuals plotted by measured &#x2126;<sub>Arag</sub> <bold>(b)</bold> and depth <bold>(c)</bold>. Points color coded for each model (<xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>).</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-12-1621280-g004.tif">
<alt-text content-type="machine-generated">Three scatter plots labeled a, b, and c show &#x3a9;_Arag model data. Plot a compares predicted and measured &#x3a9;_Arag values with a strong linear correlation. Plot b displays residuals by measured &#x3a9;_Arag with scattered points around zero. Plot c shows residuals by depth, with similar scatter patterns. Each plot includes data points in blue, orange, and green representing different models, labeled as RF 3, RF 2, and MLR 3.</alt-text>
</graphic>
</fig>
<disp-formula id="eq4">
<label>(4)</label>
<mml:math display="block" id="M4">
<mml:mrow>
<mml:msub>
<mml:mi>E</mml:mi>
<mml:mrow>
<mml:mi>e</mml:mi>
<mml:mi>s</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:msqrt>
<mml:mrow>
<mml:msubsup>
<mml:mi>E</mml:mi>
<mml:mrow>
<mml:mi>R</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>s</mml:mi>
<mml:mi>p</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi>s</mml:mi>
<mml:mi>e</mml:mi>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msubsup>
<mml:mo>+</mml:mo>
<mml:msubsup>
<mml:mi>E</mml:mi>
<mml:mrow>
<mml:mi>I</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi>p</mml:mi>
<mml:mi>u</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msubsup>
<mml:mo>+</mml:mo>
<mml:msubsup>
<mml:mi>E</mml:mi>
<mml:mrow>
<mml:mi>M</mml:mi>
<mml:mi>L</mml:mi>
<mml:mi>R</mml:mi>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msubsup>
</mml:mrow>
</mml:msqrt>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula id="eq5">
<label>(5)</label>
<mml:math display="block" id="M5">
<mml:mrow>
<mml:msub>
<mml:mi>E</mml:mi>
<mml:mrow>
<mml:mi>e</mml:mi>
<mml:mi>s</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:msqrt>
<mml:mrow>
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>n</mml:mi>
</mml:msubsup>
<mml:msup>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:msub>
<mml:mi>U</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:msub>
<mml:mi>B</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
</mml:msqrt>
</mml:mrow>
</mml:math>
</disp-formula>
<p>Uncertainty propagations were calculated using <xref ref-type="disp-formula" rid="eq4">Equation 4</xref> (<xref ref-type="bibr" rid="B15">Carter et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B46">Li et&#xa0;al., 2022</xref>). <italic>E</italic>
<sub>MLR</sub> refers to the model RMSE. <italic>E</italic>
<sub>Response</sub> represents measurement uncertainties; for pH, this is the spectrophotometric measurement uncertainty, which was set conservatively to be a constant 0.005 (<xref ref-type="bibr" rid="B16">Carter et&#xa0;al., 2024</xref>). For &#x2126;<sub>Arag</sub> this is the uncertainty from input pairs propagated through calculations of &#x2126;<sub>Arag</sub> which was set as 0.085 (<xref ref-type="bibr" rid="B56">Orr et&#xa0;al., 2018</xref>). <italic>E</italic>
<sub>input</sub> is the uncertainty of the input parameters propagated in the regression, which can be calculated using <xref ref-type="disp-formula" rid="eq5">Equation 5</xref>, where <italic>U</italic>
<sub>i</sub> is the <italic>i-</italic>th input uncertainties of the predictor properties. We set the <italic>U<sub>i</sub>
</italic> values at 0.005, 0.005&#xb0;C, and 2.2 &#xb5;mol kg<sup>&#x2212;1</sup> for S, T, and DO, respectively (<xref ref-type="bibr" rid="B15">Carter et&#xa0;al., 2018</xref>). Total uncertainty calculated is 0.12 for &#x2126;<sub>Arag</sub> and 0.0173 for pH. Other information that can be inferred from these calculations is the relative sources of uncertainty by the comparison of <italic>E</italic>
<sub>Response</sub>, <italic>E</italic>
<sub>Input</sub>, and <italic>E</italic>
<sub>MLR</sub>. In both cases the <italic>E</italic>
<sub>MLR</sub> value was the largest contributor of uncertainty, followed by <italic>E</italic>
<sub>Response</sub>.</p>
<p>In addition to the total uncertainty calculations, a better understanding of the source of the uncertainty described by the <italic>E</italic>
<sub>MLR</sub> can be achieved by examining the calculations of error used to describe model performance, such as MAPE and MAE. &#x2126;<sub>Arag</sub> models produced MAPE scores of 2.9%&#x2013;5.1% and MAE of 0.05&#x2013;0.13 in comparison to estimates of error propagation for calculation of &#x2126;<sub>Arag</sub> being &#xb1;0.16 depending on input pairs (<xref ref-type="bibr" rid="B56">Orr et&#xa0;al., 2018</xref>). Most of the uncertainty from calculation comes from the pair-constants curve, meaning methodological uncertainties for the input pairs result in little effect on the overall propagated uncertainties. Therefore, the relative uncertainty due to error of model &#x2126;<sub>Arag</sub> values has similar reliability to calculations of &#x2126;<sub>Arag</sub> from measured DIC, TA, or pH values. This was not true for pH models, as MAPE scores ranged from 0.16% to 0.22%, with an MAE of 0.011&#x2013;0.018 in comparison to a relative uncertainty of measurement methods of 0.008&#x2013;0.0012, meaning that there is a higher confidence of measured values as opposed to predicted (<xref ref-type="bibr" rid="B66">Takeshita et&#xa0;al., 2021</xref>).</p>
<p>The best model for &#x2126;<sub>Arag</sub> was the MLR model, which included all variables with an <italic>R</italic>
<sup>2</sup> = 0.99. (&#x3a9;<sub>Arag</sub> MLR 4; <xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>). MLR equation coefficients indicate that for the &#x2126;<sub>Arag</sub> model, variable importance, or contribution to explainability, is as follows, from most to least important: temperature, DO, pressure, and salinity, with temperature and DO being &gt;77% larger than pressure and salinity. The second-best performing model with <italic>R</italic>
<sup>2</sup> = 0.98 is the MLR model with three variables, which, in order of importance, are temperature, DO, and pressure (&#x3a9;<sub>Arag</sub> MLR 3; <xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>). The RF models did not outperform MLR models but came close behind, with the best RF model (&#x3a9;<sub>Arag</sub> RF 3; <xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>) having an <italic>R</italic>
<sup>2</sup> = 0.99 while using the same three variables as the second-best MLR model. For the RF models, poorer performance on test data than validation data would indicate overfitting and that the model has poor ability to generalize. However, minimal difference (&#x394;<italic>R</italic>
<sup>2</sup> &lt; 0.01) was observed in performance on testing versus validation data. This indicates that the model is not overfitted, generalized well, and can be expected to perform similarly (as it did on the test data) on new data (<xref ref-type="bibr" rid="B27">Domingos, 2012</xref>).</p>
<p>For pH, the best-performing model was the RF model that included three variables with an <italic>R</italic>
<sup>2</sup> = 0.96. (pH RF 3; <xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>). The second-best performing model with <italic>R</italic>
<sup>2</sup> = 0.975 was the MLR model with all variables, which, in order of importance, are DO, temperature, pressure, and salinity (pH MLR 4). The RF models outperformed the MLR models for pH prediction, but again by a narrow gap. Differences were observed in performance on validation and test datasets of <italic>R</italic>
<sup>2</sup> &gt; 0.6, indicating which models may be slightly overfitted. The RF model containing all four variables performed poorly, possibly due to overfitting or collinearity and thus is not included.</p>
<p>All residuals indicated nonnormality as seen in QQ-plots, histograms, and through Shapiro-Wilks <italic>p</italic>-values &lt; 0.05 (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figures S1</bold>
</xref>&#x2013;<xref ref-type="supplementary-material" rid="SM1">
<bold>S8</bold>
</xref>). To further investigate the non-normality of residuals and determine if it could be an indicator of other problems, the Durbin-Watson and Breusch-Pagan tests were used to test the assumptions for independent and homoscedastic residuals. A Durbin-Watson test for independence resulting in a value close to 2 suggests that the residuals an autocorrelated. Breusch&#x2013;Pagan test for homoscedasticity, where a <italic>p</italic> &gt; 0.05 suggests homoscedasticity. Therefore, despite the nonnormality of the residuals, it is unlikely to be problematic due to their independence, homoscedasticity, the size of the dataset, and the robust nature of the models (<xref ref-type="bibr" rid="B9">Breiman, 2001</xref>).</p>
</sec>
<sec id="s4" sec-type="discussion">
<title>Discussion</title>
<sec id="s4_1">
<title>Data selection considerations</title>
<p>The nwGOM area (latitudes 27.1&#x2013;29.0&#x2da;N and longitudes 89&#x2013;95.1&#x2da;W) was selected to isolate a relatively small geographic area where controlling factors on the carbonate system are expected to remain similar in the examined window of time and included the same stations surveyed repeatedly along the same transect (i.e., the 90&#xb0; line). This study area lies almost entirely on the Texas shelf and far enough to the west so that the effects of the freshwater discharge transported westward are less pronounced than on the bulk of the Louisiana Shelf (<xref ref-type="bibr" rid="B3">Androulidakis et&#xa0;al., 2015</xref>; <xref ref-type="bibr" rid="B53">Morey et&#xa0;al., 2003</xref>). Under heavy influence from the large river&#x2019;s watershed, salinity would be a key variable for models, although it is not detected as such in our models. Therefore, salinity was only included as a predictor variable in one of the &#x2126;<sub>Arag</sub> models and only half of the pH models.</p>
<p>Removal of the surface layer of the water column was done strategically to remove large, short-term temporally unconstrained variabilities, such as surface water gas exchange, physical, biological, and seasonal changes (<xref ref-type="bibr" rid="B43">Juranek et&#xa0;al., 2009</xref>; <xref ref-type="bibr" rid="B44">Kim et&#xa0;al., 2010</xref>; <xref ref-type="bibr" rid="B50">McGarry et&#xa0;al., 2021</xref>). In the nwGOM, removal of shallow water can potentially mitigate the minimal effects of freshwater outflow as the low-salinity river discharge is buoyant. Removal of surface water can be less important when air-surface water interactions do not affect predictor variables. Even still, removal can serve as a means of removing the effect of seasonality, though depth ranges of the mixed layer to be removed vary by location and season (<xref ref-type="bibr" rid="B43">Juranek et&#xa0;al., 2009</xref>; <xref ref-type="bibr" rid="B44">Kim et&#xa0;al., 2010</xref>; <xref ref-type="bibr" rid="B50">McGarry et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B52">Montes et&#xa0;al., 2016</xref>). Since most of the models produced in this study contain DO, removing air-sea interaction was necessary. Based on the final models chosen for &#x2126;<sub>Arag</sub> and pH, the relationships showed that the exclusion of the upper 30 m of the water column did improve the performance of all &#x2126;<sub>Arag</sub> models. When models are compared with the model containing the same spatial data but all depths, models with the upper 30 m removed, except for pH MLR models, had either greater R<sup>2</sup>, lower MSE or MAPE, or a combination of the three (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S2</bold>
</xref>). The improvements in all models indicate that the removal of surface water increases the performance of the models, though it should be noted that there may be bias across seasons due to unaccounted-for surface water and mixed-layer inclusion in the datasets used for training. Seasonal bias could also occur due to a greater quantity of summer observations in the training dataset. Further data beyond the 2007&#x2013;2023 time series, as well as the inclusion of more seasonal data, are needed to properly assess the potential existence of these biases.</p>
</sec>
<sec id="s4_2">
<title>Aragonite models</title>
<p>There are many known relationships between &#x2126;<sub>Arag</sub> and physical and chemical parameters, which is why the variables salinity, temperature, pressure, and DO were chosen in developing &#x3a9;<sub>Arag</sub> models. However, the degree to which each of these variables is intertwined with &#x2126;<sub>Arag</sub> is not so easy to identify but can be inferred by their selection and importance in the models with the highest performance.</p>
<p>Temperature was the most prominent predictor for &#x2126;<sub>Arag</sub> in all models (<xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>). The strength of the relationship can be explained by &#x2126;<sub>Arag</sub> as a function of K<sub>sp</sub> and [CO<sub>3</sub>
<sup>2&#x2212;</sup>], and K<sub>sp</sub> as a function of temperature, salinity, and pressure. Temperature as a dominant predictor variable aligns well with models built for &#x2126;<sub>Arag</sub> prediction in other areas, which also found temperature to be a primary predictor for &#x2126;<sub>Arag</sub> (<xref ref-type="bibr" rid="B1">Alin et&#xa0;al., 2012</xref>; <xref ref-type="bibr" rid="B43">Juranek et&#xa0;al., 2009</xref>; <xref ref-type="bibr" rid="B44">Kim et&#xa0;al., 2010</xref>; <xref ref-type="bibr" rid="B50">McGarry et&#xa0;al., 2021</xref>). Pressure was included in all MLR models and two out of three RF models (<xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>). The pressure term in the models can be in part explained by &#x2126;<sub>Arag</sub> as a function of K<sub>sp</sub> and [CO<sub>3</sub>
<sup>2&#x2212;</sup>], and K<sub>sp</sub> is also a function of pressure, that is, increasing solubility with depth. DO was included in both MLR models and one RF model (<xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>). The inclusion of DO is likely due to the close coupling of DO and DIC in subsurface waters, which includes CO<sub>2</sub> uptake (photosynthesis) and release (respiration) and lacks exchange with the atmosphere in the subsurface (&gt;30 m). Although salinity was also tested, it was only included in one MLR model based on selection criteria and was the least important predictor variable by coefficient (<xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>). The lack of salinity could be in part because salinity in the modeled dataset has small variability from 33.2 to 36.7 without outliers and an interquartile range (IQR) of from 35.2 to 36.4. This means salinity has a relatively small contribution to variability, either due to the hydrography of the area or possibly in part to the limitation of the dataset&#x2019;s spatial and depth coverage. By focusing on the nwGOM and removing the upper 30 m it is possible that freshwater outflow transported from the Mississippi-Atchafalaya watershed westward over the Louisiana-Texas shelf in the surface water has been partially or wholly avoided (<xref ref-type="bibr" rid="B53">Morey et&#xa0;al., 2003</xref>).</p>
</sec>
<sec id="s4_3">
<title>pH models</title>
<p>Although anthropogenic CO<sub>2</sub> is the dominant driver for long&#x2010;term, that is, multidecadal, change in pH in the upper ocean water column, the variations observed in coastal waters on decadal time scales are largely attributed to driving forces including production shift due to changes in nutrient input (<xref ref-type="bibr" rid="B73">Wang et&#xa0;al., 2013</xref>) and ocean circulation changes (e.g., upwelling) (<xref ref-type="bibr" rid="B32">Feely et&#xa0;al., 2008</xref>) and terrestrial influences (<xref ref-type="bibr" rid="B11">Cai, 2003</xref>; <xref ref-type="bibr" rid="B28">Duarte et&#xa0;al., 2013</xref>; <xref ref-type="bibr" rid="B33">Gomez et&#xa0;al., 2021</xref>). The fact that DO was included as an important predictor variable suggests that biological activities are a major driving force for the carbonate system. Similarly, DO was also found to be the strongest predictor of pH in the Northeast US (<xref ref-type="bibr" rid="B50">McGarry et&#xa0;al., 2021</xref>). Pressure was also important in all the models, as carbonate system equilibria are affected by pressure (<xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>). There is a visually notable trend of overprediction of pH from 400 to 800 m; this is an area with lower pH and &#x3a9; than the rest of the water column. We attribute this bias to the non-linearity of the carbonate system. This type of bias has also been seen in other similar models in different geographic locations as well (<xref ref-type="bibr" rid="B42">Juranek et&#xa0;al., 2011</xref>, <xref ref-type="bibr" rid="B43">2009</xref>).</p>
</sec>
<sec id="s4_4">
<title>Comparison with previous models</title>
<p>One of the primary motivations behind the use of the MLR modeling with standardized variables is the ability to use empirical relationships among predictor variables to accurately describe the controlling processes in the study area, whereas RF modeling can only provide relative feature importance, which is not a quantification of the correlation between variables but of the relative impact on the performance of the model, or reduced impurity, that can be attributed to that predictor variable (<xref ref-type="bibr" rid="B9">Breiman, 2001</xref>). Due to standardization, the strength of the predictor variable correlation with the target variable can be inferred by the absolute value of the coefficients of predictor variables included in the models. However, it is important to note that statistical models reflect correlations between predictor variables and target variables but do not necessarily reveal mechanistic relationships (<xref ref-type="bibr" rid="B62">Quinn and Keough, 2002</xref>) (<xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>).</p>
<p>Because of differences in hydrography, river influences, and location of the drivers of the carbonate system, statistical models for carbonate system parameters are often specific to the geographic areas where they were created for. Although many of the primary drivers of the carbonate system remain the same, the secondary variables shift, as does the degree to which they influence.</p>
<p>In the literature, &#x2126;<sub>Arag</sub> models have been created for the northwestern Atlantic (<xref ref-type="bibr" rid="B50">McGarry et&#xa0;al., 2021</xref>), northern Gulf of Alaska (<xref ref-type="bibr" rid="B30">Evans et&#xa0;al., 2013</xref>), Central Oregon Coast (<xref ref-type="bibr" rid="B42">Juranek et&#xa0;al., 2011</xref>, <xref ref-type="bibr" rid="B43">2009</xref>), southern California Current system (<xref ref-type="bibr" rid="B1">Alin et&#xa0;al., 2012</xref>), Queen Charlotte Sound (<xref ref-type="bibr" rid="B36">Hare et&#xa0;al., 2025</xref>), U.S. east coast (<xref ref-type="bibr" rid="B46">Li et&#xa0;al., 2022</xref>), and the Sea of Japan (East Sea) (<xref ref-type="bibr" rid="B44">Kim et&#xa0;al., 2010</xref>). These models all have between two and three variables and an adjusted <italic>R</italic>
<sup>2</sup> &#x2265; 0.91 compared to between one and four variables with an adjusted R<sup>2</sup> &#x2265; 0.94 in this study. The primary predictor variable in all previous models except two (<xref ref-type="bibr" rid="B30">Evans et&#xa0;al., 2013</xref>; <xref ref-type="bibr" rid="B42">Juranek et&#xa0;al., 2011</xref>) is temperature, as is the case in this study. Most models also include some combination of temperature with salinity, oxygen, and interaction terms; one model also used pressure (<xref ref-type="bibr" rid="B44">Kim et&#xa0;al., 2010</xref>), and one used NO<sub>3</sub>
<sup>-</sup> (<xref ref-type="bibr" rid="B30">Evans et&#xa0;al., 2013</xref>). The models created here and those created previously for &#x2126;<sub>Arag</sub> agreed on the use of temperature as a primary predictor variable in combination with other predictor variables.</p>
<p>pH models have been created for the eastern US coast (<xref ref-type="bibr" rid="B50">McGarry et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B46">Li et&#xa0;al., 2022</xref>), the northeast Pacific (<xref ref-type="bibr" rid="B42">Juranek et&#xa0;al., 2011</xref>), the southern California Current System (<xref ref-type="bibr" rid="B1">Alin et&#xa0;al., 2012</xref>), Queen Charlotte Sound (<xref ref-type="bibr" rid="B36">Hare et&#xa0;al., 2025</xref>), and the global ocean (<xref ref-type="bibr" rid="B14">Carter et al., 2021</xref>). All those models also used temperature and DO (<xref ref-type="bibr" rid="B1">Alin et&#xa0;al., 2012</xref>; <xref ref-type="bibr" rid="B42">Juranek et&#xa0;al., 2011</xref>; <xref ref-type="bibr" rid="B50">McGarry et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B46">Li et&#xa0;al., 2022</xref>), with one model also using an interaction term between DO and temperature (<xref ref-type="bibr" rid="B1">Alin et&#xa0;al., 2012</xref>), one using nutrients, salinity, and multiple interaction terms (<xref ref-type="bibr" rid="B50">McGarry et&#xa0;al., 2021</xref>) and, lastly, one using AOU and salinity (<xref ref-type="bibr" rid="B36">Hare et&#xa0;al., 2025</xref>). They included between two and seven variables and resulted in adjusted <italic>R</italic>
<sup>2</sup> &#x2265; 0.89 in comparison to our models, which have between three and four variables and adjusted <italic>R</italic>
<sup>2</sup> &#x2265; 0.93. Our MLR models are consistent with previous models that DO was an important predictor variable for pH.</p>
</sec>
<sec id="s4_5">
<title>Model applicability</title>
<p>The GOMECC-1 survey in 2007 was among the first to collect comprehensive, high-quality, measurements of the inorganic carbonate system parameters in the GOM. However, the capacity for autonomous observation of ocean carbonate chemistry is growing rapidly. By combining real-time, high-resolution data with modeling methods, it is possible to create comprehensive data coverage while simultaneously providing data validation via comparison between different data sources. With the use of MLR in combination with a single Argo profile float containing DO and temperature sensors, <xref ref-type="bibr" rid="B42">Juranek et&#xa0;al. (2011)</xref> were able to create a 14-month comprehensive time series containing &#x2126;<sub>Arag</sub> and pH, which were verified by comparisons to independently measured values. <xref ref-type="bibr" rid="B30">Evans et&#xa0;al. (2013)</xref> applied models to field data from glider flight and a GLOBEC mesoscale SeaSoar survey (<xref ref-type="bibr" rid="B19">Cowles, 2002</xref>) to create complete datasets, allowing for identification of variability of &#x2126;<sub>Arag</sub>. <xref ref-type="bibr" rid="B36">Hare et&#xa0;al. (2025)</xref> also had success with this in Queen Charlotte Sound, British Columbia, where regression models were applied to regional autonomous glider data. Although autonomous measurements for biogeochemical parameters in the GOM have just begun (<xref ref-type="bibr" rid="B57">Osborne et&#xa0;al., 2024</xref>), successful combination of models and autonomous data collection should greatly improve geochemical data coverage and advance carbonate chemistry studies.</p>
<p>In addition to long-term changes, there is strong motivation to apply empirical models to year-round hydrographic data to reconstruct the seasonal cycle of carbonate chemistry. For example, <xref ref-type="bibr" rid="B43">Juranek et&#xa0;al. (2009)</xref> created a model using data collected in spring and successfully used it to predict the seasonal changes in &#x2126;<sub>Arag</sub> under the assumption that the seasonal variability of the primary independent variables (temperature and DO) would be comparable to the variations encountered spatially during the initial data collection. One method to mitigate effects of the lack of seasonal variation data on the relationships between physical and chemical data is by excluding depths influenced by local meteorological conditions from the analysis (<xref ref-type="bibr" rid="B44">Kim et&#xa0;al., 2010</xref>). Most models were calibrated using mostly summer data and none with subsurface seasonal data for the GOM. Our models contain data from all seasons with slightly more data points from summer months. Seasonal application is expected to be viable in the produced models for pH as it was explained primarily by biologically driven changes, that is, the coupling between DIC and DO. Seasonal application is also expected to be viable for &#x3a9;<sub>Arag</sub> at depths of 30&#x2013;300 m, as biological changes are primarily driven by DIC rather than TA (<xref ref-type="bibr" rid="B4">Angl&#xe8;s et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B39">Hu et&#xa0;al., 2018</xref>). It is expected that changes in DIC should be captured in these models due to their relationship with DO in the subsurface (<xref ref-type="bibr" rid="B2">Anderson and Sarmiento, 1994</xref>; <xref ref-type="bibr" rid="B35">Hales et&#xa0;al., 2005</xref>).</p>
<p>Furthermore, there is also motivation to apply statistical models to forecast the carbonate system conditions as OA progresses. Previously created MLRs have been applied to generate hindcasts (up to 40 years) on carbonate chemistry (<xref ref-type="bibr" rid="B30">Evans et&#xa0;al., 2013</xref>; <xref ref-type="bibr" rid="B44">Kim et&#xa0;al., 2010</xref>). However, the temporal applicability of a model is expected to be limited. To use the model for predictions beyond the timeframe of training data, even with relatively unchanged circulation and watershed conditions, it is necessary to make corrections for shifts caused by changes in the anthropogenic CO<sub>2</sub> inventory in the water column, increasing error beyond model uncertainty. This is because empirical models do not account for anthropogenic addition of CO<sub>2</sub>, which changes the ratio of DIC/DO. Due to atmospheric CO<sub>2</sub> input, previous modeling studies have calculated that the statistical relationships will need to be updated every 5<bold>&#x2013;</bold>10 years to account for changes in target variables (<xref ref-type="bibr" rid="B1">Alin et&#xa0;al., 2012</xref>; <xref ref-type="bibr" rid="B42">Juranek et&#xa0;al., 2011</xref>, <xref ref-type="bibr" rid="B43">2009</xref>). The models can be used for estimation of data within the timeframe of the training data (2007&#x2013;2023), with the requirement that seasonality or waterbody changes are captured, hindcasting up to 10 years (1997&#x2013;2007), and predicting up to 10 years (2023&#x2013;2033) (<xref ref-type="bibr" rid="B42">Juranek et&#xa0;al., 2011</xref>). For example, <xref ref-type="bibr" rid="B43">Juranek et&#xa0;al. (2009)</xref> created a model using data collected in spring, and they successfully used it to predict the seasonal changes in &#x2126;<sub>Arag.</sub> The assumption of this study was that the seasonal variability of the primary independent variables (temperature and DO) would be comparable to the variation encountered spatially during the initial data collection just a year prior. However, to extend the reconstruction further than 10 years, it would be necessary to account for the progressive addition of anthropogenic CO<sub>2</sub> to the water column over time. For example, <xref ref-type="bibr" rid="B44">Kim et&#xa0;al. (2010)</xref> used estimates of anthropogenic CO<sub>2</sub> invasion to subtract anthropogenic CO<sub>2</sub> and apply modeling estimates of DIC in the Sea of Japan (East Sea) to create a 40-year reconstruction. In our study, the total uncertainty values are 0.12 for &#x2126;<sub>Arag</sub> and 0.0173 for pH. The rate of pH decline at the surface during the 2013&#x2013;2022 period is 0.0025 &#xb1; 0.0005 year<sup>1&#x2212;</sup>, while there is no discernable trend in &#x2126;<sub>Arag</sub> (Hu, unpublished data). Based on this, it would take 14 years for the accumulation of anthropogenic carbon to surpass two times the uncertainty for pH (i.e., the time of emergence, <xref ref-type="bibr" rid="B69">Turk et&#xa0;al., 2019</xref>). Due to the lack of trend in &#x3a9;<sub>Arag</sub>, these models could be applicable for a longer period in this region. However, we recommend conservatively applying caution when using beyond the 10-year window. For all models but particularly &#x3a9;<sub>Arag,</sub> it seems likely that other factors such as changing climatology may be the first to influence model applicability rather than anthropogenic CO<sub>2</sub> intrusion.</p>
</sec>
<sec id="s4_6">
<title>Data scarcity</title>
<p>Technological advancements (e.g., satellites, floats, and gliders) have made autonomous measurements for selected variables possible. Even though satellites provide large volumes of invaluable data, their scope is limited not only to the surface layer but also to measurements of temperature and ocean color, which can be used for estimations of productivity, dissolved organic matter, and sea surface CO<sub>2</sub> partial pressure (e.g., <xref ref-type="bibr" rid="B18">Chen et&#xa0;al., 2019</xref>). Some remedies for the lack of data beyond the surface have come in the form of novel technologies, including Argo floats and gliders (<xref ref-type="bibr" rid="B57">Osborne et&#xa0;al., 2024</xref>). The Argo array supports more than 3,000 floats across the global ocean, supplying profiles of T and S, of which about 200 are also equipped with a DO sensor. Biogeochemical-Argo (BGC-Argo) floats can take measurements from the surface to 2,000 dbar and provide high-resolution autonomous measurements for some combinations of chlorophyll, particle backscatter, DO, nitrate, pH, or irradiance (<xref ref-type="bibr" rid="B63">Roemmich et&#xa0;al., 2019</xref>). Nevertheless, this equipment is limited in coverage ability; BGC-Argos have yet to reach the comprehensive coverage of traditional Argos, and they usually do not operate on continental shelves. Gliders share the similar biogeochemical sensors used by the BGC-Argo floats with a similar mode of operation but perform sawtooth trajectories from the surface to the bottom, or to 200&#x2013;1,000 m depth, and their deployments are limited largely by biofouling, battery life, and payload space, hindering their ability to carry many sensors (<xref ref-type="bibr" rid="B64">Saba et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B67">Testor et&#xa0;al., 2019</xref>). Additionally, all data from floats and gliders must undergo rigorous quality control and correction of potential errors in sensors, such as drift and be compared to lab-measured samples when possible (<xref ref-type="bibr" rid="B63">Roemmich et&#xa0;al., 2019</xref>).</p>
<p>Given the performance of the models created here, it would be reasonable to expect that in combination with datasets from data collection via these platforms, one or both of pH and &#x2126;<sub>Arag</sub> could be estimated. Traditional Argos, as well as most gliders, have temperature and pressure (or depth) measurements, meaning &#x3a9;<sub>Arag</sub> could be estimated using either of the two RF models with <italic>R</italic>
<sup>2</sup> values of 0.94 and 0.97. With the addition of DO, which is included in a subset of the Argos and in the BGC-Argos, the &#x2126;<sub>Arag</sub> model with an <italic>R</italic>
<sup>2</sup> of 0.98 could be applied. Additionally, the pH model with <italic>R</italic>
<sup>2</sup> of 0.94 could be used; even though pH sensors are included in many BGC-Argos, the modeled results could provide robust data quality check capability.</p>
</sec>
<sec id="s4_7">
<title>Recommendations</title>
<p>The models developed in this study serve as valuable tools for reconstructing pH and &#x3a9;<sub>Arag</sub> data in the absence of direct chemical observations, leveraging available hydrographic information. The models can also be used for hindcasting over a 10-year period (1997&#x2013;2007) and for forecasting over the next ~10 years (2023&#x2013;2033) in the nwGOM, if seasonality and watermass changes are adequately captured. Through modeling, our results showed that RF models do not have any distinct advantage over the MLR models which are commonly used. It is crucial to examine potential shifts in circulation, water mass composition, and anthropogenic CO<sub>2</sub> accumulation to refine and update the models over time. Despite their robustness, several potential issues remain across all models, suggesting room for improvement, such as difficulties estimating target variables due to significant variation in the shallow and mixed layers, a need for additional data points, or the application of more complex models. Future work to enhance these models could involve incorporating additional data, as well as exploring the application of neural network AI models and locally interpolated regressions, such as those employed by <xref ref-type="bibr" rid="B14">Carter et al. (2021)</xref>.</p>
</sec>
</sec>
</body>
<back>
<sec id="s5" sec-type="data-availability">
<title>Data availability statement</title>
<p>The original contributions presented in the study are publicly available. This data can be found here: <uri xlink:href="https://github.com/ejundt/XRModel.git">https://github.com/ejundt/XRModel.git</uri> and <uri xlink:href="https://wq.gcoos.org/oa/data/csv/">https://wq.gcoos.org/oa/data/csv/</uri>. Publicly available datasets were analyzed in this study. This data can be found here: <uri xlink:href="https://glodap.info/">https://glodap.info/</uri>.</p>
</sec>
<sec id="s6" sec-type="author-contributions">
<title>Author contributions</title>
<p>EJ: Conceptualization, Data curation, Formal analysis, Investigation, Methodology, Software, Validation, Visualization, Writing &#x2013; original draft, Writing &#x2013; review &amp; editing. XH: Conceptualization, Funding acquisition, Resources, Supervision, Writing &#x2013; review &amp; editing.</p>
</sec>
<sec id="s7" sec-type="funding-information">
<title>Funding</title>
<p>The author(s) declare financial support was received for the research and/or publication of this article. This study was funded by NOAA Ocean Acidification Program (award #NA19OAR0170354).</p>
</sec>
<ack>
<title>Acknowledgments</title>
<p>This publication was made possible by the National Oceanic and Atmospheric Administration, Office of Education Educational Partnership Program with Minority Serving Institutions award (NA21SEC4810004). We would like to thank Steven DiMarco, Piers Chapman, Sakib Mahmud, students and postdocs from Texas A&amp;M University, and the captain and crew on board R/V Pelican for their assistance with sample collection and analyses. We would also like to thank the scientific party on previous GOMECC cruises for their contributions to the data used in this study.</p>
</ack>
<sec id="s8" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s9" sec-type="ai-statement">
<title>Generative AI statement</title>
<p>The author(s) declare that no Generative AI was used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p>
</sec>
<sec id="s10" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s11" sec-type="disclaimer">
<title>Author disclaimer</title>
<p>Its contents are solely the responsibility of the award recipient and do not necessarily represent the official views of the U.S. Department of Commerce, National Oceanic and Atmospheric Administration.</p>
</sec>
<sec id="s12" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fmars.2025.1621280/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fmars.2025.1621280/full#supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="DataSheet1.pdf" id="SM1" mimetype="application/pdf"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Alin</surname> <given-names>S. R.</given-names>
</name>
<name>
<surname>Feely</surname> <given-names>R. A.</given-names>
</name>
<name>
<surname>Dickson</surname> <given-names>A. G.</given-names>
</name>
<name>
<surname>Mart&#xed;n Hern&#xe1;ndez-Ay&#xf3;n</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Juranek</surname> <given-names>L. W.</given-names>
</name>
<name>
<surname>Ohman</surname> <given-names>M. D.</given-names>
</name>
<etal/>
</person-group>. (<year>2012</year>). <article-title>Robust empirical relationships for estimating the carbonate system in the southern California Current System and application to CalCOFI hydrographic cruise data, (2005&#x2013;2011)</article-title>. <source>J. Geophys Res. Oceans</source> <volume>117</volume>, <fpage>5033</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1029/2011JC007511</pub-id>
</citation></ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Anderson</surname> <given-names>L. A.</given-names>
</name>
<name>
<surname>Sarmiento</surname> <given-names>J. L.</given-names>
</name>
</person-group> (<year>1994</year>). <article-title>Redfield ratios of remineralization determined by nutrient data analysis</article-title>. <source>Global Biogeochem Cycles</source> <volume>8</volume>, <fpage>65</fpage>&#x2013;<lpage>80</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1029/93GB03318</pub-id>
</citation></ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Androulidakis</surname> <given-names>Y. S.</given-names>
</name>
<name>
<surname>Kourafalou</surname> <given-names>V. H.</given-names>
</name>
<name>
<surname>Schiller</surname> <given-names>R. V.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Process studies on the evolution of the Mississippi River plume: Impact of topography, wind and discharge conditions</article-title>. <source>Cont Shelf Res.</source> <volume>107</volume>, <fpage>33</fpage>&#x2013;<lpage>49</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.csr.2015.07.014</pub-id>
</citation></ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Angl&#xe8;s</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Jordi</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Henrichs</surname> <given-names>D. W.</given-names>
</name>
<name>
<surname>Campbell</surname> <given-names>L.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Influence of coastal upwelling and river discharge on the phytoplankton community composition in the northwestern Gulf of Mexico</article-title>. <source>Prog. Oceanogr</source> <volume>173</volume>, <fpage>26</fpage>&#x2013;<lpage>36</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.pocean.2019.02.001</pub-id>
</citation></ref>
<ref id="B5">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Barbero</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Pierrot</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Wanninkhof</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Baringer</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Hooper</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>J. Z.</given-names>
</name>
<etal/>
</person-group>. (<year>2017</year>). <source>Cruise Report: Third Gulf of Mexico Ecosystems and Carbon Cycle (GOMECC-3) Cruise</source>. <publisher-loc>Miami, FL 33149</publisher-loc>: <publisher-name>NOAA Atlantic Oceanographic and Meteorological Laboratory</publisher-name>. doi:&#xa0;<pub-id pub-id-type="doi">10.25923/y6m9-fy08</pub-id>
</citation></ref>
<ref id="B6">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Barbero</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Stefanick</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Hooper</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Wanninkhof</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Baringer</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Smith</surname> <given-names>I.</given-names>
</name>
<etal/>
</person-group>. (<year>2024</year>). <source>Cruise Report: Fourth Gulf of Mexico Ecosystems and Carbon Cycle (GOMECC-4) Cruise</source>. <publisher-name>Atlantic Oceanographic and Meteorological Laboratory</publisher-name>, <publisher-loc>Miami, FL 33149</publisher-loc>. doi:&#xa0;<pub-id pub-id-type="doi">10.25923/rwx5-s713</pub-id>
</citation></ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bednar&#x161;ek</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Tarling</surname> <given-names>G. A.</given-names>
</name>
<name>
<surname>Bakker</surname> <given-names>D. C. E.</given-names>
</name>
<name>
<surname>Fielding</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Jones</surname> <given-names>E. M.</given-names>
</name>
<name>
<surname>Venables</surname> <given-names>H. J.</given-names>
</name>
<etal/>
</person-group>. (<year>2012</year>). <article-title>Extensive dissolution of live pteropods in the Southern Ocean</article-title>. <source>Nat. Geosci</source> <volume>5</volume>, <fpage>881</fpage>&#x2013;<lpage>885</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/NGEO1635</pub-id>
</citation></ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bostock</surname> <given-names>H. C.</given-names>
</name>
<name>
<surname>Mikaloff Fletcher</surname> <given-names>S. E.</given-names>
</name>
<name>
<surname>Williams</surname> <given-names>M. J. M.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Estimating carbonate parameters from hydrographic data for the intermediate and deep waters of the Southern Hemisphere oceans</article-title>. <source>Biogeosciences</source> <volume>10</volume> (<issue>10</issue>), <fpage>6199</fpage>&#x2013;<lpage>6213</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.5194/BG-10-6199-2013</pub-id>
</citation></ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Breiman</surname> <given-names>L.</given-names>
</name>
</person-group> (<year>2001</year>). <article-title>Random forests</article-title>. <source>Mach. Learn</source> <volume>45</volume>, <fpage>5</fpage>&#x2013;<lpage>32</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1023/A:1010933404324/METRICS</pub-id>
</citation></ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Burnham</surname> <given-names>K. P.</given-names>
</name>
<name>
<surname>Anderson</surname> <given-names>D. R.</given-names>
</name>
</person-group> (<year>2004</year>). <article-title>Multimodel inference: understanding AIC and BIC in model selection</article-title>. <source>Sociological Methods &amp; Research</source> <volume>33</volume>, <fpage>261</fpage>&#x2013;<lpage>304</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1177/0049124104268644</pub-id>
</citation></ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cai</surname> <given-names>W. J.</given-names>
</name>
</person-group> (<year>2003</year>). <article-title>Riverine inorganic carbon flux and rate of biological uptake in the Mississippi River plume</article-title>. <source>Geophys Res. Lett.</source> <volume>30</volume>, <fpage>1032</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1029/2002GL016312</pub-id>
</citation></ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cai</surname> <given-names>W. J.</given-names>
</name>
<name>
<surname>Hu</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>W. J.</given-names>
</name>
<name>
<surname>Murrell</surname> <given-names>M. C.</given-names>
</name>
<name>
<surname>Lehrter</surname> <given-names>J. C.</given-names>
</name>
<name>
<surname>Lohrenz</surname> <given-names>S. E.</given-names>
</name>
<etal/>
</person-group>. (<year>2011</year>). <article-title>Acidification of subsurface coastal waters enhanced by eutrophication</article-title>. <source>Nat. Geosci.</source> <volume>11</volume>, <fpage>766</fpage>&#x2013;<lpage>770</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/ngeo1297</pub-id>
</citation></ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cai</surname> <given-names>W. J.</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>Y. Y.</given-names>
</name>
<name>
<surname>Feely</surname> <given-names>R. A.</given-names>
</name>
<name>
<surname>Wanninkhof</surname> <given-names>R.</given-names>
</name>
<name>
<surname>J&#xf6;nsson</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Alin</surname> <given-names>S. R.</given-names>
</name>
<etal/>
</person-group>. (<year>2020</year>). <article-title>Controls on surface water carbonate chemistry along North American ocean margins</article-title>. <source>Nat. Commun.</source> <volume>11</volume>, <fpage>1</fpage>&#x2013;<lpage>13</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41467-020-16530-z</pub-id>, PMID: <pub-id pub-id-type="pmid">32483136</pub-id></citation></ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Carter</surname> <given-names>B. R.</given-names>
</name>
<name>
<surname>Bittig</surname> <given-names>H. C.</given-names>
</name>
<name>
<surname>Fassbender</surname> <given-names>A. J.</given-names>
</name>
<name>
<surname>Sharp</surname> <given-names>J. D.</given-names>
</name>
<name>
<surname>Takeshita</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>Y.-Y.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>New and updated global empirical seawater property estimation routines</article-title>. <source>Limnology and Oceanography: Methods</source>. <volume>19</volume>,  <fpage>785</fpage>&#x2013;<lpage>809</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/lom3.10461</pub-id>
</citation></ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Carter</surname> <given-names>B. R.</given-names>
</name>
<name>
<surname>Feely</surname> <given-names>R. A.</given-names>
</name>
<name>
<surname>Williams</surname> <given-names>N. L.</given-names>
</name>
<name>
<surname>Dickson</surname> <given-names>A. G.</given-names>
</name>
<name>
<surname>Fong</surname> <given-names>M. B.</given-names>
</name>
<name>
<surname>Takeshita</surname> <given-names>Y.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Updated methods for global locally interpolated estimation of alkalinity, pH, and nitrate</article-title>. <source>Limnol Oceanogr Methods</source> <volume>16</volume>, <fpage>119</fpage>&#x2013;<lpage>131</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/LOM3.10232;JOURNAL:JOURNAL:15415856;WGROUP:STRING:PUBLICATION</pub-id>
</citation></ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Carter</surname> <given-names>B. R.</given-names>
</name>
<name>
<surname>Sharp</surname> <given-names>J. D.</given-names>
</name>
<name>
<surname>Dickson</surname> <given-names>A. G.</given-names>
</name>
<name>
<surname>&#xc1;lvarez</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Fong</surname> <given-names>M. B.</given-names>
</name>
<name>
<surname>Garc&#xed;a-Ib&#xe1;&#xf1;ez</surname> <given-names>M. I.</given-names>
</name>
<etal/>
</person-group>. (<year>2024</year>). <article-title>Uncertainty sources for measurable ocean carbonate chemistry variables</article-title>. <source>Limnol Oceanogr</source> <volume>69</volume>, <fpage>1</fpage>&#x2013;<lpage>21</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/LNO.12477</pub-id>
</citation></ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Cai</surname> <given-names>W. J.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>L.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>The marine carbonate system of the Arctic Ocean: Assessment of internal consistency and sampling considerations, summer 2010</article-title>. <source>Mar. Chem.</source> <volume>176</volume>, <fpage>174</fpage>&#x2013;<lpage>188</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/J.MARCHEM.2015.09.007</pub-id>
</citation></ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Hu</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Barnes</surname> <given-names>B. B.</given-names>
</name>
<name>
<surname>Wanninkhof</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Cai</surname> <given-names>W.-J.</given-names>
</name>
<name>
<surname>Barbero</surname> <given-names>L.</given-names>
</name>
<etal/>
</person-group>. (<year>2019</year>). <article-title>A machine learning approach to estimate surface ocean pCO 2 from satellite measurements</article-title>. <source>Remote Sens Environ.</source> <volume>228</volume>, <fpage>203</fpage>&#x2013;<lpage>226</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.rse.2019.04.019</pub-id>
</citation></ref>
<ref id="B19">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Cowles</surname> <given-names>T.</given-names>
</name>
</person-group> (<year>2002</year>). <source>GLOBEC Northeast Pacific California Current Cruise Report, R/V Thomas G. Thompson (T0205) Alternative Cruise ID: Mesoscale Survey TN147 Chief Scientist: Cruise Objectives</source>. <publisher-name>College of Oceanic and Atmospheric Sciences Oregon State University</publisher-name> <publisher-loc>Corvallis, OR</publisher-loc>.</citation></ref>
<ref id="B20">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Culberson</surname> <given-names>C. H.</given-names>
</name>
</person-group> (<year>1991</year>). <source>WHO Operations and Methods: Dissolved Oxygen. Newark</source>. <publisher-name>College of Marine Studies. University of Delaware</publisher-name>. <publisher-loc>Newark, U.S.A.</publisher-loc>
</citation></ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Culberson</surname> <given-names>C. H.</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>S.</given-names>
</name>
</person-group> (<year>1987</year>). <article-title>An automated amperometric oxygen titration</article-title>. <source>Deep Sea Res.</source> <volume>34</volume>, <fpage>875</fpage>&#x2013;<lpage>880</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/0198-0149(87)90042-2</pub-id>
</citation></ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cutler</surname> <given-names>D. R.</given-names>
</name>
<name>
<surname>Edwards</surname> <given-names>T. C.</given-names>
</name>
<name>
<surname>Beard</surname> <given-names>K. H.</given-names>
</name>
<name>
<surname>Cutler</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Hess</surname> <given-names>K. T.</given-names>
</name>
<name>
<surname>Gibson</surname> <given-names>J.</given-names>
</name>
<etal/>
</person-group>. (<year>2007</year>). <article-title>Random forests for classification in ecology</article-title>. <source>Ecology</source> <volume>88</volume>, <fpage>2783</fpage>&#x2013;<lpage>2792</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1890/07-0539.1</pub-id>, PMID: <pub-id pub-id-type="pmid">18051647</pub-id></citation></ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dickson</surname> <given-names>A. G.</given-names>
</name>
<name>
<surname>Millero</surname> <given-names>F. J.</given-names>
</name>
</person-group> (<year>1987</year>). <article-title>A comparison of the equilibrium constants for the dissociation of carbonic acid in seawater media</article-title>. <source>Deep Sea Research Part A, Oceanographic Research Papers</source> <volume>34</volume> (<issue>10</issue>), <fpage>1733</fpage>&#x2013;<lpage>1743</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/0198-0149(87)90021-5</pub-id>
</citation></ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dickson</surname> <given-names>A. G.</given-names>
</name>
<name>
<surname>Wesolowski</surname> <given-names>D. J.</given-names>
</name>
<name>
<surname>Palmer</surname> <given-names>D. A.</given-names>
</name>
<name>
<surname>Mesmer</surname> <given-names>R. E.</given-names>
</name>
</person-group> (<year>1990</year>). <article-title>Dissociation constant of bisulfate ion in aqueous sodium chloride solutions to 250&#xb0;C</article-title>. <source>J. Physical Chem.</source> <volume>94</volume> (<issue>20</issue>), <fpage>7978</fpage>&#x2013;<lpage>7985</lpage>. doi:&#xa0;0.1021/J100383A042/ASSET/J100383A042.FP.PNG_V03
</citation></ref>
<ref id="B25">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Dickson</surname> <given-names>A. G.</given-names>
</name>
<name>
<surname>Sabine</surname> <given-names>C. L.</given-names>
</name>
<name>
<surname>Christian</surname> <given-names>J. R.</given-names>
</name>
</person-group> (<year>2007</year>). &#x201c;<article-title>Guide to best practices for ocean CO2 measurements</article-title>,&#x201d; in <source>PICES Special Publication, Guide to Best Practices for Ocean CO2 measurements</source> (<publisher-loc>North Pacific Marine Science Organization Sidney, British Columbia, Canada</publisher-loc>: <publisher-name>PICES Special Publication</publisher-name>).</citation></ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>DiMarco</surname> <given-names>S. F.</given-names>
</name>
<name>
<surname>Strauss</surname> <given-names>J.</given-names>
</name>
<name>
<surname>May</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Mullins-Perry</surname> <given-names>R. L.</given-names>
</name>
<name>
<surname>Grossman</surname> <given-names>E. L.</given-names>
</name>
<name>
<surname>Shormann</surname> <given-names>D.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Texas coastal hypoxia linked to Brazos river discharge as revealed by oxygen isotopes</article-title>. <source>Aquat Geochem</source> <volume>18</volume>, <fpage>159</fpage>&#x2013;<lpage>181</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/S10498-011-9156-X/METRICS</pub-id>
</citation></ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Domingos</surname> <given-names>P.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>A few useful things to know about machine learning</article-title>. <source>Commun. ACM</source>. <volume>55</volume> (<issue>10</issue>), <fpage>78</fpage>&#x2013;<lpage>87</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1145/2347736.2347755</pub-id>
</citation></ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Duarte</surname> <given-names>C. M.</given-names>
</name>
<name>
<surname>Hendriks</surname> <given-names>I. E.</given-names>
</name>
<name>
<surname>Moore</surname> <given-names>T. S.</given-names>
</name>
<name>
<surname>Olsen</surname> <given-names>Y. S.</given-names>
</name>
<name>
<surname>Steckbauer</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Ramajo</surname> <given-names>L.</given-names>
</name>
<etal/>
</person-group>. (<year>2013</year>). <article-title>Is ocean acidification an open-ocean syndrome? Understanding anthropogenic impacts on seawater pH</article-title>. <source>Estuaries Coasts</source> <volume>36</volume>, <fpage>221</fpage>&#x2013;<lpage>236</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/S12237-013-9594-3/TABLES/1</pub-id>
</citation></ref>
<ref id="B29">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Erez</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Reynaud</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Silverman</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Schneider</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Allemand</surname> <given-names>D.</given-names>
</name>
</person-group> (<year>2011</year>). &#x201c;<article-title>Coral calcification under ocean acidification and global change</article-title>,&#x201d; in <source>Coral Reefs: An Ecosystem in Transition</source> (<publisher-loc>Springer Dordrecht, Netherlands</publisher-loc>: <publisher-name>Springer Netherlands</publisher-name>), <fpage>151</fpage>&#x2013;<lpage>176</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/978-94-007-0114-4_10</pub-id>
</citation></ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Evans</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Mathis</surname> <given-names>J. T.</given-names>
</name>
<name>
<surname>Winsor</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Statscewich</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Whitledge</surname> <given-names>T. E.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>A regression modeling approach for studying carbonate system variability in the northern Gulf of Alaska</article-title>. <source>J. Geophys Res. Oceans</source> <volume>118</volume>, <fpage>476</fpage>&#x2013;<lpage>489</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1029/2012JC008246</pub-id>
</citation></ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Eyre</surname> <given-names>B. D.</given-names>
</name>
<name>
<surname>Andersson</surname> <given-names>A. J.</given-names>
</name>
<name>
<surname>Cyronak</surname> <given-names>T.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Benthic coral reef calcium carbonate dissolution in an acidifying ocean</article-title>. <source>Nat. Climate Change</source> <volume>11</volume>, <fpage>969</fpage>&#x2013;<lpage>976</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nclimate2380</pub-id>
</citation></ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Feely</surname> <given-names>R. A.</given-names>
</name>
<name>
<surname>Sabine</surname> <given-names>C. L.</given-names>
</name>
<name>
<surname>Hernandez-Ayon</surname> <given-names>J. M.</given-names>
</name>
<name>
<surname>Ianson</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Hales</surname> <given-names>B.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>Evidence for upwelling of corrosive &#x201c;acidified&#x201d; water onto the continental shelf</article-title>. <source>Science (1979)</source> <volume>320</volume>, <fpage>1490</fpage>&#x2013;<lpage>1492</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1126/science.1155676</pub-id>, PMID: <pub-id pub-id-type="pmid">18497259</pub-id></citation></ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gomez</surname> <given-names>F. A.</given-names>
</name>
<name>
<surname>Wanninkhof</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Barbero</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Lee</surname> <given-names>S. K.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Increasing river alkalinity slows ocean acidification in the northern Gulf of Mexico</article-title>. <source>Geophys Res. Lett.</source> <volume>48</volume>, <elocation-id>e2021GL096521</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1029/2021GL096521</pub-id>
</citation></ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gran</surname> <given-names>G.</given-names>
</name>
</person-group> (<year>1952</year>). <article-title>Determination of the equivalence point in potentiometric titrations</article-title>. <source>Part II Analyst</source> <volume>77</volume>, <fpage>661</fpage>&#x2013;<lpage>671</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1039/an9527700661</pub-id>
</citation></ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hales</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Takahashi</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Bandstra</surname> <given-names>L.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>Atmospheric CO2 uptake by a coastal upwelling system</article-title>. <source>Global Biogeochem Cycles</source> <volume>19</volume>, <fpage>1</fpage>&#x2013;<lpage>11</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1029/2004GB002295</pub-id>
</citation></ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hare</surname> <given-names>A. A.</given-names>
</name>
<name>
<surname>Evans</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Dosser</surname> <given-names>H. V.</given-names>
</name>
<name>
<surname>Jackson</surname> <given-names>J. M.</given-names>
</name>
<name>
<surname>Alin</surname> <given-names>S. R.</given-names>
</name>
<name>
<surname>Hannah</surname> <given-names>C.</given-names>
</name>
<etal/>
</person-group>. (<year>2025</year>). <article-title>Regression-based characterization of the marine carbonate system across shelf and nearshore waters of Queen Charlotte Sound</article-title>. <source>Mar. Chem.</source> <volume>270</volume>, <elocation-id>104511</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/J.MARCHEM.2025.104511</pub-id>
</citation></ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hoegh-Guldberg</surname> <given-names>O.</given-names>
</name>
<name>
<surname>Mumby</surname> <given-names>P. J.</given-names>
</name>
<name>
<surname>Hooten</surname> <given-names>A. J.</given-names>
</name>
<name>
<surname>Steneck</surname> <given-names>R. S.</given-names>
</name>
<name>
<surname>Greenfield</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Gomez</surname> <given-names>E.</given-names>
</name>
<etal/>
</person-group>. (<year>2007</year>). <article-title>Coral reefs under rapid climate change and ocean acidification</article-title>. <source>Science</source> <volume>318</volume>, <fpage>1737</fpage>&#x2013;<lpage>1742</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1126/SCIENCE.1152509/SUPPL_FILE/HOEGH-GULDBERG.SOM.PDF</pub-id>
</citation></ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hu</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>W. J.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Cai</surname> <given-names>W. J.</given-names>
</name>
<name>
<surname>Rabalais</surname> <given-names>N. N.</given-names>
</name>
<etal/>
</person-group>. (<year>2017</year>). <article-title>Effects of eutrophication and benthic respiration on water column carbonate chemistry in a traditional hypoxic zone in the Northern Gulf of Mexico</article-title>. <source>Mar. Chem.</source> <volume>194</volume>, <fpage>33</fpage>&#x2013;<lpage>42</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/J.MARCHEM.2017.04.004</pub-id>
</citation></ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hu</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Nuttall</surname> <given-names>M. F.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Yao</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Staryk</surname> <given-names>C. J.</given-names>
</name>
<name>
<surname>McCutcheon</surname> <given-names>M. R.</given-names>
</name>
<etal/>
</person-group>. (<year>2018</year>). <article-title>Seasonal variability of carbonate chemistry and decadal changes in waters of a marine sanctuary in the Northwestern Gulf of Mexico</article-title>. <source>Mar. Chem.</source> <volume>205</volume>, <fpage>16</fpage>&#x2013;<lpage>28</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.marchem.2018.07.006</pub-id>
</citation></ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Huang</surname> <given-names>W. J.</given-names>
</name>
<name>
<surname>Cai</surname> <given-names>W. J.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Hu</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Lohrenz</surname> <given-names>S. E.</given-names>
</name>
<etal/>
</person-group>. (<year>2015</year>). <article-title>The response of inorganic carbon distributions and dynamics to upwelling-favorable winds on the northern Gulf of Mexico during summer</article-title>. <source>Cont Shelf Res.</source> <volume>111</volume>, <fpage>211</fpage>&#x2013;<lpage>222</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/J.CSR.2015.08.020</pub-id>
</citation></ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Johnson</surname> <given-names>K. M.</given-names>
</name>
<name>
<surname>King</surname> <given-names>A. E.</given-names>
</name>
<name>
<surname>Sieburth</surname> <given-names>J. M. N.</given-names>
</name>
</person-group> (<year>1985</year>). <article-title>Coulometric TCO2 analyses for marine studies; an introduction</article-title>. <source>Mar. Chem.</source> <volume>16</volume>, <fpage>61</fpage>&#x2013;<lpage>82</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/0304-4203(85)90028-3</pub-id>
</citation></ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Juranek</surname> <given-names>L. W.</given-names>
</name>
<name>
<surname>Feely</surname> <given-names>R. A.</given-names>
</name>
<name>
<surname>Gilbert</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Freeland</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Miller</surname> <given-names>L. A.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Real-time estimation of pH and aragonite saturation state from Argo profiling floats: Prospects for an autonomous carbon observing strategy</article-title>. <source>Geophys Res. Lett.</source> <volume>38</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.1029/2011GL048580</pub-id>
</citation></ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Juranek</surname> <given-names>L. W.</given-names>
</name>
<name>
<surname>Feely</surname> <given-names>R. A.</given-names>
</name>
<name>
<surname>Peterson</surname> <given-names>W. T.</given-names>
</name>
<name>
<surname>Alin</surname> <given-names>S. R.</given-names>
</name>
<name>
<surname>Hales</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Lee</surname> <given-names>K.</given-names>
</name>
<etal/>
</person-group>. (<year>2009</year>). <article-title>A novel method for determination of aragonite saturation state on the continental shelf of central Oregon using multi&#x2010;parameter relationships with hydrographic data</article-title>. <source>Geophys Res. Lett.</source> <volume>36</volume>, <fpage>1</fpage>&#x2013;<lpage>6</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1029/2009GL040778</pub-id>
</citation></ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kim</surname> <given-names>T. W.</given-names>
</name>
<name>
<surname>Lee</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Feely</surname> <given-names>R. A.</given-names>
</name>
<name>
<surname>Sabine</surname> <given-names>C. L.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>C. T. A.</given-names>
</name>
<name>
<surname>Jeong</surname> <given-names>H. J.</given-names>
</name>
<etal/>
</person-group>. (<year>2010</year>). <article-title>Prediction of Sea of Japan (East Sea) acidification over the past 40 years using a multiparameter regression model</article-title>. <source>Global Biogeochem Cycles</source> <volume>24</volume>, <fpage>1</fpage>&#x2013;<lpage>14</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1029/2009GB003637</pub-id>
</citation></ref>
<ref id="B45">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Kutner</surname> <given-names>M. H.</given-names>
</name>
<name>
<surname>Nachtsheim</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Neter</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>W.</given-names>
</name>
</person-group> (<year>2005</year>). <source>Applied linear statistical models</source> (<publisher-loc>McGraw-Hill/Irwin New York, NY, USA</publisher-loc>: <publisher-name>McGraw-Hill Irwin</publisher-name>).</citation></ref>
<ref id="B46">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>Y. Y.</given-names>
</name>
<name>
<surname>Kirchman</surname> <given-names>D. L.</given-names>
</name>
<name>
<surname>Cai</surname> <given-names>W. J.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Carbonate parameter estimation and its application in revealing temporal and spatial variation in the south and Mid-Atlantic Bight, USA</article-title>. <source>J. Geophys Res. Oceans</source> <volume>127</volume>, <elocation-id>e2022JC018811</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1029/2022JC018811</pub-id>
</citation></ref>
<ref id="B47">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lima</surname> <given-names>I. D.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Z. A.</given-names>
</name>
<name>
<surname>Cameron</surname> <given-names>L. P.</given-names>
</name>
<name>
<surname>Grabowski</surname> <given-names>J. H.</given-names>
</name>
<name>
<surname>Rheuban</surname> <given-names>J. E.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Predicting carbonate chemistry on the northwest Atlantic shelf using neural networks</article-title>. <source>J. Geophys Res. Biogeosci</source> <volume>128</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.1029/2023JG007536</pub-id>
</citation></ref>
<ref id="B48">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Patsavas</surname> <given-names>M. C.</given-names>
</name>
<name>
<surname>Byrne</surname> <given-names>R. H.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Purification and characterization of meta-cresol purple for spectrophotometric seawater ph measurements</article-title>. <source>Environ. Sci. Technol.</source> <volume>45</volume>, <fpage>4862</fpage>&#x2013;<lpage>4868</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1021/es200665d</pub-id>, PMID: <pub-id pub-id-type="pmid">21563773</pub-id></citation></ref>
<ref id="B49">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Massey</surname> <given-names>F. J.</given-names>
</name>
</person-group> (<year>1951</year>). <article-title>The Kolmogorov-Smirnov test for goodness of fit</article-title>. <source>J. Am. Stat. Assoc.</source> <volume>46</volume>, <fpage>68</fpage>&#x2013;<lpage>78</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/01621459.1951.10500769</pub-id>
</citation></ref>
<ref id="B50">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>McGarry</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Siedlecki</surname> <given-names>S. A.</given-names>
</name>
<name>
<surname>Salisbury</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Alin</surname> <given-names>S. R.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Multiple linear regression models for reconstructing and exploring processes controlling the carbonate system of the northeast US from basic hydrographic data</article-title>. <source>J. Geophys Res. Oceans</source> <volume>126</volume>, <fpage>1</fpage>&#x2013;<lpage>19</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1029/2020JC016480</pub-id>
</citation></ref>
<ref id="B51">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mehrbach</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Culberson</surname> <given-names>C. H.</given-names>
</name>
<name>
<surname>Hawley</surname> <given-names>J. E.</given-names>
</name>
<name>
<surname>Pytkowicx</surname> <given-names>R. M.</given-names>
</name>
</person-group> (<year>1973</year>). <article-title>Measurement of the apparent dissociation constants of carbonic acid in seawater at atmospheric pressure</article-title>. <source>Limnology and Oceanography</source> <volume>18</volume> (<issue>6</issue>), <fpage>897</fpage>&#x2013;<lpage>907</lpage>.</citation></ref>
<ref id="B52">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Montes</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Muller-Karger</surname> <given-names>F. E.</given-names>
</name>
<name>
<surname>Cianca</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Lomas</surname> <given-names>M. W.</given-names>
</name>
<name>
<surname>Lorenzoni</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Habtes</surname> <given-names>S.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Decadal variability in the oxygen inventory of North Atlantic subtropical underwater captured by sustained, long-term oceanographic time series observations</article-title>. <source>Global Biogeochem Cycles</source> <volume>30</volume>, <fpage>460</fpage>&#x2013;<lpage>478</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/2015GB005183</pub-id>
</citation></ref>
<ref id="B53">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Morey</surname> <given-names>S. L.</given-names>
</name>
<name>
<surname>Martin</surname> <given-names>P. J.</given-names>
</name>
<name>
<surname>O&#x2019;Brien</surname> <given-names>J. J.</given-names>
</name>
<name>
<surname>Wallcraft</surname> <given-names>A. A.</given-names>
</name>
<name>
<surname>Zavala-Hidalgo</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Morey</surname> <given-names>C.</given-names>
</name>
<etal/>
</person-group>. (<year>2003</year>). <article-title>Export pathways for river discharged fresh water in the northern Gulf of Mexico</article-title>. <source>J. Geophys Res. Oceans</source> <volume>108</volume>, <fpage>3303</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1029/2002JC001674</pub-id>
</citation></ref>
<ref id="B54">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Muller-Karger</surname> <given-names>F. E.</given-names>
</name>
<name>
<surname>Smith</surname> <given-names>J. P.</given-names>
</name>
<name>
<surname>Werner</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Roffer</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>Y.</given-names>
</name>
<etal/>
</person-group>. (<year>2015</year>). <article-title>Natural variability of surface oceanographic conditions in the offshore Gulf of Mexico</article-title>. <source>Prog. Oceanogr</source> <volume>134</volume>, <fpage>54</fpage>&#x2013;<lpage>76</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.pocean.2014.12.007</pub-id>
</citation></ref>
<ref id="B55">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mucci</surname> <given-names>A.</given-names>
</name>
</person-group>. (<year>1983</year>). <article-title>The solubility of calcite and aragonite in seawater at various salinities, temperatures, and one atmosphere total pressure</article-title>. <source>American Journal of Science</source> <volume>283</volume>, <fpage>780</fpage>&#x2013;<lpage>799</lpage>.</citation></ref>
<ref id="B56">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Orr</surname> <given-names>J. C.</given-names>
</name>
<name>
<surname>Epitalon</surname> <given-names>J. M.</given-names>
</name>
<name>
<surname>Dickson</surname> <given-names>A. G.</given-names>
</name>
<name>
<surname>Gattuso</surname> <given-names>J. P.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Routine uncertainty propagation for the marine carbon dioxide system</article-title>. <source>Mar. Chem.</source> <volume>207</volume>, <fpage>84</fpage>&#x2013;<lpage>107</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/J.MARCHEM.2018.10.006</pub-id>
</citation></ref>
<ref id="B57">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Osborne</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>Y. Y.</given-names>
</name>
<name>
<surname>Soden</surname> <given-names>M.</given-names>
</name>
<name>
<surname>McWhorter</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Barbero</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Wanninkhof</surname> <given-names>R.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>A neural network algorithm for quantifying seawater pH using Biogeochemical-Argo floats in the open Gulf of Mexico</article-title>. <source>Front. Mar. Sci.</source> <volume>11</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/FMARS.2024.1468909/BIBTEX</pub-id>
</citation></ref>
<ref id="B58">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Patsavas</surname> <given-names>M. C.</given-names>
</name>
<name>
<surname>Byrne</surname> <given-names>R. H.</given-names>
</name>
<name>
<surname>Wanninkhof</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Feely</surname> <given-names>R. A.</given-names>
</name>
<name>
<surname>Cai</surname> <given-names>W. J.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Internal consistency of marine carbonate system measurements and assessments of aragonite saturation state: Insights from two U.S. coastal cruises</article-title>. <source>Mar. Chem.</source> <volume>176</volume>, <fpage>9</fpage>&#x2013;<lpage>20</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/J.MARCHEM.2015.06.022</pub-id>
</citation></ref>
<ref id="B59">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pedregosa</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Duchesnay</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Varoquaux</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Gramfort</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Michel</surname> <given-names>V.</given-names>
</name>
<name>
<surname>Thirion</surname> <given-names>B.</given-names>
</name>
<etal/>
</person-group>. (<year>2011</year>). <article-title>Scikit-learn</article-title>. <source>Journal of Machine Learning Research</source> <volume>12</volume>, <fpage>2825</fpage>&#x2013;<lpage>2830</lpage>.</citation></ref>
<ref id="B60">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Peng</surname> <given-names>T.-H.</given-names>
</name>
<name>
<surname>Langdon</surname> <given-names>C.</given-names>
</name>
</person-group> (<year>2007</year>). <source>Gulf of Mexico and East Coast Carbon Cruise (GOMECC) Chief Scientists: Tsung-Hung Peng and Chris Langdon NOAA Atlantic Oceanographic and Meteorological Laboratory Cruise Report</source>. <publisher-name>College of Marine Studies. University of Delaware</publisher-name>. <publisher-loc>Newark, U.S.A.</publisher-loc>
</citation></ref>
<ref id="B61">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Probst</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Wright</surname> <given-names>M. N.</given-names>
</name>
<name>
<surname>Boulesteix</surname> <given-names>A. L.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Hyperparameters and tuning strategies for random forest</article-title>. <source>Wiley Interdiscip Rev. Data Min Knowl. Discov.</source> <volume>9</volume>, <elocation-id>e1301</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/WIDM.1301</pub-id>
</citation></ref>
<ref id="B62">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Quinn</surname> <given-names>G. P.</given-names>
</name>
<name>
<surname>Keough</surname> <given-names>M. J.</given-names>
</name>
</person-group> (<year>2002</year>). <source>Experimental Design and Data Analysis for Biologists</source> (<publisher-loc>Cambridge, England</publisher-loc>: <publisher-name>Cambridge University Press</publisher-name>).</citation></ref>
<ref id="B63">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Roemmich</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Alford</surname> <given-names>M. H.</given-names>
</name>
<name>
<surname>Claustre</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Johnson</surname> <given-names>K. S.</given-names>
</name>
<name>
<surname>King</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Moum</surname> <given-names>J.</given-names>
</name>
<etal/>
</person-group>. (<year>2019</year>). <article-title>On the future of Argo: A global, full-depth, multi-disciplinary array</article-title>. <source>Front. Mar. Sci.</source> <volume>6</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/FMARS.2019.00439/BIBTEX</pub-id>
</citation></ref>
<ref id="B64">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Saba</surname> <given-names>G. K.</given-names>
</name>
<name>
<surname>Wright-Fairbanks</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Cai</surname> <given-names>W. J.</given-names>
</name>
<name>
<surname>Barnard</surname> <given-names>A. H.</given-names>
</name>
<name>
<surname>Jones</surname> <given-names>C. P.</given-names>
</name>
<etal/>
</person-group>. (<year>2019</year>). <article-title>The development and validation of a profiling glider deep ISFET-based pH sensor for high resolution observations of coastal and ocean acidification</article-title>. <source>Front. Mar. Sci.</source> <volume>6</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/FMARS.2019.00664/BIBTEX</pub-id>
</citation></ref>
<ref id="B65">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Sharp</surname> <given-names>J. D.</given-names>
</name>
<name>
<surname>Pierrot</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Orr</surname> <given-names>J. C.</given-names>
</name>
<name>
<surname>Epitalon</surname> <given-names>J.-M.</given-names>
</name>
<name>
<surname>Humphreys</surname> <given-names>M. P.</given-names>
</name>
<name>
<surname>Wallace</surname> <given-names>D. W. R.</given-names>
</name>
<etal/>
</person-group>. (<year>2023</year>). <source>CO2SYSv3 for MATLAB (Version v3.2.1)</source>. <publisher-name>European Organization for Nuclear Research</publisher-name>, <publisher-loc>Gen&#xe8;ve Switzerland</publisher-loc>.</citation></ref>
<ref id="B66">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Takeshita</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Warren</surname> <given-names>J. K.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Spaulding</surname> <given-names>R. S.</given-names>
</name>
<name>
<surname>Byrne</surname> <given-names>R. H.</given-names>
</name>
<name>
<surname>Carter</surname> <given-names>B. R.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Consistency and stability of purified meta-cresol purple for spectrophotometric pH measurements in seawater</article-title>. <source>Mar. Chem.</source> <volume>236</volume>, <elocation-id>104018</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/J.MARCHEM.2021.104018</pub-id>
</citation></ref>
<ref id="B67">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Testor</surname> <given-names>P.</given-names>
</name>
<name>
<surname>DeYoung</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Rudnick</surname> <given-names>D. L.</given-names>
</name>
<name>
<surname>Glenn</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Hayes</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Lee</surname> <given-names>C.</given-names>
</name>
<etal/>
</person-group>. (<year>2019</year>). <article-title>OceanGliders: A component of the integrated GOOS</article-title>. <source>Front. Mar. Sci.</source> <volume>6</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/FMARS.2019.00422/BIBTEX</pub-id>
</citation></ref>
<ref id="B68">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Thessen</surname> <given-names>A. E.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Adoption of machine learning techniques in ecology and earth science</article-title>. <source>One Ecosystem</source> <volume>1</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3897/oneeco.1.e8621</pub-id>
</citation></ref>
<ref id="B69">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Turk</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Hu</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Gledhill</surname> <given-names>D. K.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Z. A.</given-names>
</name>
<name>
<surname>Jiang</surname> <given-names>L.</given-names>
</name>
<etal/>
</person-group>. (<year>2019</year>). <article-title>Time of emergence of surface ocean carbon dioxide trends in the North American coastal margins in support of ocean acidification observing system design</article-title>. <source>Front. Mar. Sci</source>. <fpage>6</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fmars.2019.00091</pub-id>
</citation></ref>
<ref id="B70">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Uppstr&#xf6;m</surname> <given-names>L. R.</given-names>
</name>
</person-group>. (<year>1974</year>). <article-title>The boron/chlorinity ratio of deep-sea water from the Pacific Ocean</article-title>. <source>DSRA</source> <volume>21</volume> (<issue>2</issue>), <fpage>161</fpage>&#x2013;<lpage>162</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/0011-7471(74)90074-6</pub-id>
</citation></ref>
<ref id="B71">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>van Heuven</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Pierrot</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Rae</surname> <given-names>J. W. B.</given-names>
</name>
<name>
<surname>Lewis</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Wallace</surname> <given-names>D. W. R.</given-names>
</name>
</person-group> (<year>2011</year>). <source>MATLAB Program Developed for CO2 System Calculations</source>. <publisher-name>Carbon Dioxide Information Analysis Center, Oak Ridge National Laboratory, U.S. DoE</publisher-name>, <publisher-loc>Oak Ridge, TN</publisher-loc>.</citation></ref>
<ref id="B72">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Vujovic</surname> <given-names>Z.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Classification model evaluation metrics</article-title>. <source>Int. J. Advanced Comput. Sci. Appl</source>. doi:&#xa0;<pub-id pub-id-type="doi">10.14569/IJACSA.2021.0120670</pub-id>
</citation></ref>
<ref id="B73">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>Z. A.</given-names>
</name>
<name>
<surname>Wanninkhof</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Cai</surname> <given-names>W. J.</given-names>
</name>
<name>
<surname>Byrne</surname> <given-names>R. H.</given-names>
</name>
<name>
<surname>Hu</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Peng</surname> <given-names>T. H.</given-names>
</name>
<etal/>
</person-group>. (<year>2013</year>). <article-title>The marine inorganic carbon system along the Gulf of Mexico and Atlantic coasts of the United States: Insights from a transregional coastal carbon study</article-title>. <source>Limnol Oceanogr</source> <volume>58</volume>, <fpage>325</fpage>&#x2013;<lpage>342</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.4319/lo.2013.58.1.0325</pub-id>
</citation></ref>
<ref id="B74">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Wanninkhof</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Wood</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Barbero</surname> <given-names>L.</given-names>
</name>
</person-group> (<year>2012</year>). <source>Gulf of Mexico and East Coast Carbon Cruise #2 (GOMECC-2)</source> (<publisher-name>NOAA Atlantic Oceanographic and Meteorological Laboratory</publisher-name>).</citation></ref>
<ref id="B75">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Winkler</surname> <given-names>L. W.</given-names>
</name>
</person-group> (<year>1888</year>). <article-title>The determination of oxygen dissolved in water</article-title>. <source>Rep. German Chem. Soc.</source> <volume>21</volume>, <fpage>2843</fpage>&#x2013;<lpage>2855</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/cber.188802102122</pub-id>
</citation></ref>
<ref id="B76">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zeebe</surname> <given-names>R. E.</given-names>
</name>
<name>
<surname>Ridgwell</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Zeebe</surname> <given-names>R. E.</given-names>
</name>
<name>
<surname>Ridgwell</surname> <given-names>A.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Past changes in ocean carbonate chemistry</article-title>. <source>Ocean Acidification</source> <volume>6</volume>, <fpage>21</fpage>&#x2013;<lpage>40</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/oso/9780199591091.003.0007</pub-id>
</citation></ref>
<ref id="B77">
<citation citation-type="web">
<person-group person-group-type="author">
<name>
<surname>Zeebe</surname> <given-names>R. E.</given-names>
</name>
<name>
<surname>Wolf-Gladrow</surname> <given-names>D.</given-names>
</name>
</person-group> (<year>2001</year>). <source>CO2 in Seawater: Equilibrium, Kinetics, Isotopes</source>. <edition>1st Edition</edition> Vol. <volume>65</volume> (<publisher-loc>Amsterdam, Netherlands</publisher-loc>: <publisher-name>Elsevier Science</publisher-name>). Available online at: <uri xlink:href="https://www.elsevier.com/books/co2-in-seawater-equilibrium-kinetics-isotopes/zeebe/978-0-444-50946-8">https://www.elsevier.com/books/co2-in-seawater-equilibrium-kinetics-isotopes/zeebe/978-0-444-50946-8</uri>.</citation></ref>
</ref-list>
</back>
</article>