<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3-mathml3.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:ali="http://www.niso.org/schemas/ali/1.0/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="1.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Mar. Sci.</journal-id>
<journal-title-group>
<journal-title>Frontiers in Marine Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Mar. Sci.</abbrev-journal-title>
</journal-title-group>
<issn pub-type="epub">2296-7745</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fmars.2025.1729116</article-id>
<article-version article-version-type="Version of Record" vocab="NISO-RP-8-2008"/>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Original Research</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>A data-driven approach to mesoscale ocean forecasting</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes">
<name><surname>Oke</surname><given-names>Peter R.</given-names></name>
<xref ref-type="corresp" rid="c001"><sup>*</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/625275/overview"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="visualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/visualization/">Visualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Rykova</surname><given-names>Tatiana</given-names></name>
<uri xlink:href="https://loop.frontiersin.org/people/2349183/overview"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
</contrib-group>
<aff id="aff1"><institution>Commonwealth Scientific and Industrial Research Organisation (CSIRO), Environment</institution>, <city>Hobart</city>, <state>TAS</state>,&#xa0;<country country="au">Australia</country></aff>
<author-notes>
<corresp id="c001"><label>*</label>Correspondence: Peter R. Oke, <email xlink:href="mailto:peter.oke@csiro.au">peter.oke@csiro.au</email></corresp>
</author-notes>
<pub-date publication-format="electronic" date-type="pub" iso-8601-date="2025-12-11">
<day>11</day>
<month>12</month>
<year>2025</year>
</pub-date>
<pub-date publication-format="electronic" date-type="collection">
<year>2025</year>
</pub-date>
<volume>12</volume>
<elocation-id>1729116</elocation-id>
<history>
<date date-type="received">
<day>20</day>
<month>10</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>25</day>
<month>11</month>
<year>2025</year>
</date>
<date date-type="rev-recd">
<day>20</day>
<month>11</month>
<year>2025</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2025 Oke and Rykova.</copyright-statement>
<copyright-year>2025</copyright-year>
<copyright-holder>Oke and Rykova</copyright-holder>
<license>
<ali:license_ref start_date="2025-12-11">https://creativecommons.org/licenses/by/4.0/</ali:license_ref>
<license-p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</license-p>
</license>
</permissions>
<abstract>
<p>Accurate ocean forecasting is essential for many marine industries, including oil and gas, search and rescue, and Defence. Traditional forecasting systems typically produce analyses that are not dynamically consistent &#x2013; leading to initialisation shock that degrades forecasts. These systems are computationally intensive and generate vast amounts of data, making it difficult for end users to interpret and exploit. Here, we develop a data-driven alternative using analog forecasting. We use along-track sea-level anomaly observations to identify past ocean states that most closely match present conditions in a large archive of model simulations. These historical cases serve as analogs to the present state. The subsequent evolution of each analog is then assembled into an ensemble forecast. We generate 15-day sea-level anomaly forecasts for twelve 5<sup>&#xb0;</sup>x5<sup>&#xb0;</sup> regions around Australia and demonstrate that our system outperforms traditional operational forecasts in 40-60% of cases, performs equally well (no statistical difference) in about 30% of cases, and is outperformed in about 10-25% of cases. By offering a computationally efficient approach to predicting mesoscale ocean circulation, analog forecasting presents a viable and practical alternative or complement for ocean prediction.</p>
</abstract>
<kwd-group>
<kwd>ocean forecasting</kwd>
<kwd>eddies</kwd>
<kwd>observations</kwd>
<kwd>analog forecasting</kwd>
<kwd>nearest neighbours</kwd>
<kwd>data assimilation</kwd>
</kwd-group>
<funding-group>
<award-group id="gs1">
<funding-source id="sp1">
<institution-wrap>
<institution>Commonwealth Scientific and Industrial Research Organisation</institution>
<institution-id institution-id-type="doi" vocab="open-funder-registry" vocab-identifier="10.13039/open_funder_registry">10.13039/501100000943</institution-id>
</institution-wrap>
</funding-source>
</award-group>
<funding-statement>The author(s) declared financial support was received for this work and/or its publication. This work was supported by CSIRO.</funding-statement>
</funding-group>
<counts>
<fig-count count="14"/>
<table-count count="3"/>
<equation-count count="1"/>
<ref-count count="109"/>
<page-count count="24"/>
<word-count count="12346"/>
</counts>
<custom-meta-group>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Physical Oceanography</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<label>1</label>
<title>Introduction</title>
<p>Ocean forecasting has improved significantly since its inception under the Global Ocean Data Assimilation Experiment (GODAE, <xref ref-type="bibr" rid="B96">Smith, 2000</xref>). However, several long-standing challenges remain. One fundamental challenge is the &#x201c;curse of dimensionality&#x201d; (<xref ref-type="bibr" rid="B19">Christiansen, 2018</xref>), where the large number of degrees of freedom in ocean models makes data assimilation and forecasting computationally intensive. The ocean is large, and scales that are most important to marine industries are short. As a result, simulating mesoscale processes in ocean general circulation models is computationally expensive. Additionally, when observations and model fields are combined using any method of sequential data assimilation, the resulting gridded analysis is usually not an exact solution to the model&#x2019;s equations. Initialising a model with such an analysis introduces artificial adjustments, often called &#x201c;initialisation shock&#x201d; (e.g., <xref ref-type="bibr" rid="B61">Malanotte-Rizzoli et&#xa0;al., 1989</xref>; <xref ref-type="bibr" rid="B7">Balmaseda et&#xa0;al., 2009</xref>; <xref ref-type="bibr" rid="B90">Sandery et&#xa0;al., 2011</xref>; <xref ref-type="bibr" rid="B4">Arango et&#xa0;al., 2023</xref>), that disrupts the model integration (e.g., <xref ref-type="bibr" rid="B23">Daley, 1981</xref>), leading to a degraded forecast (e.g., <xref ref-type="bibr" rid="B62">Martin et&#xa0;al., 2002</xref>; <xref ref-type="bibr" rid="B8">Balmaseda et&#xa0;al., 2007</xref>; <xref ref-type="bibr" rid="B82">Raghukumar et&#xa0;al., 2015</xref>; <xref ref-type="bibr" rid="B83">Raja et&#xa0;al., 2024</xref>).</p>
<p>In numerical weather prediction (NWP), various approaches mitigate the initialisation problem (e.g., <xref ref-type="bibr" rid="B99">Temperton and Williamson, 1981</xref>; <xref ref-type="bibr" rid="B59">Lynch and Huang, 1992</xref>; <xref ref-type="bibr" rid="B51">Kleist et&#xa0;al., 2009</xref>). While these methods do not entirely resolve the issue, they have significantly improved short-range (e.g., <xref ref-type="bibr" rid="B43">Hou et&#xa0;al., 2022</xref>) and medium-range (e.g., <xref ref-type="bibr" rid="B77">Peng et&#xa0;al., 2023</xref>) forecast skill. Ocean forecasting, however, generally employs less sophisticated initialisation techniques, including variants of incremental analysis updates (IAU; e.g., <xref ref-type="bibr" rid="B11">Bloom et&#xa0;al., 1996</xref>; <xref ref-type="bibr" rid="B33">Ferry et&#xa0;al., 2010</xref>; <xref ref-type="bibr" rid="B83">Raja et&#xa0;al., 2024</xref>; <xref ref-type="bibr" rid="B65">Mirouze et&#xa0;al., 2024</xref>), nudging (e.g., <xref ref-type="bibr" rid="B72">Oke et&#xa0;al., 2008</xref>; <xref ref-type="bibr" rid="B90">Sandery et&#xa0;al., 2011</xref>), and geostrophic or pressure adjustments (e.g., <xref ref-type="bibr" rid="B15">Burgers et&#xa0;al., 2002</xref>; <xref ref-type="bibr" rid="B104">Waters et&#xa0;al., 2017</xref>). These methods usually fail to fully eliminate initialisation errors, with forecasts often including a significant initialisation shock that degrades the quality of predictions at the start of each forecast. Metrics assessing ocean analysis and forecast errors consistently show a noticeable jump in error within the first day or so after a forecast is initialised (e.g., <xref ref-type="bibr" rid="B72">Oke et&#xa0;al., 2008</xref>; <xref ref-type="bibr" rid="B86">Ryan et&#xa0;al., 2015</xref>; <xref ref-type="bibr" rid="B82">Raghukumar et&#xa0;al., 2015</xref>; <xref ref-type="bibr" rid="B4">Arango et&#xa0;al., 2023</xref>). 
Evidence of this initialisation shock is seen in the results from a traditional ocean forecasting system that is used as the benchmark for forecast skill in this study.</p>
<p>Here, we develop a simple analog forecasting system that addresses the issues of dynamic consistency and cost-efficiency, to predict regional sea-level anomaly (SLA). The idea behind analog forecasting is that &#x201c;history repeats itself&#x201d;. Analog weather forecasts are produced by objectively identifying a past atmospheric state that resembles current conditions (e.g., <xref ref-type="bibr" rid="B57">Lorenz, 1969</xref>). This past state is considered an analog to the present. The evolution of the atmosphere that immediately follows the identified historic analog is offered as a forecast. The quality of the forecast depends on the quality of the analog.</p>
<p>This idea is not new. Throughout history, ancient civilisations practiced forms of weather forecasting based entirely on observation and experience (<xref ref-type="bibr" rid="B35">Green et&#xa0;al., 2010</xref>). By monitoring environmental patterns and recalling past occurrences, they anticipated future conditions and planned accordingly.</p>
<p>The idea of analogs was first applied to NWP by <xref ref-type="bibr" rid="B57">Lorenz (1969)</xref>, who suggested that two similar states of the atmosphere could be considered estimates of the same atmosphere, but with a different error superimposed. <xref ref-type="bibr" rid="B57">Lorenz (1969)</xref> exploited this idea and analysed the evolution of similar states of the atmosphere to understand predictability and error growth rates in weather forecasts.</p>
<p>Analog forecasting, sometimes referred to as reforecasting (e.g., <xref ref-type="bibr" rid="B40">Hamill et&#xa0;al., 2006</xref>) or model-analog forecasting (e.g., <xref ref-type="bibr" rid="B30">Ding et&#xa0;al., 2020</xref>), has been used for seasonal prediction (e.g., <xref ref-type="bibr" rid="B29">Ding et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B102">Walsh et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B1">Acosta Navarro et&#xa0;al., 2025</xref>), long-range weather forecasting (e.g., <xref ref-type="bibr" rid="B10">Bergen and Harnack, 1982</xref>), and NWP (e.g., <xref ref-type="bibr" rid="B25">Delle Monache et&#xa0;al., 2013</xref>; <xref ref-type="bibr" rid="B5">Bagtasa, 2021</xref>). However, most weather centres have abandoned analog forecasting, noting challenges in finding useful analogs (e.g., <xref ref-type="bibr" rid="B100">Van den Dool, 2007</xref>). Moreover, it is widely acknowledged that for NWP, analogs diverge sufficiently rapidly that dynamical forecasts outperform analog forecasts (e.g., <xref ref-type="bibr" rid="B102">Walsh et&#xa0;al., 2021</xref>). However, ocean time-scales are generally longer than atmospheric time-scales, and the skill of ocean forecast systems is still relatively poor (e.g., <xref ref-type="bibr" rid="B87">Rykova, 2023</xref>). It&#x2019;s therefore possible that analog forecasting may be suitable for ocean forecasting, and that with the emergence of &#x201c;big data&#x201d; and with careful application, analog forecasting may become useful for mainstream or niche ocean prediction (e.g., prediction of oil spill trajectories or phytoplankton blooms).</p>
<p>The principles behind analog forecasting also underpin ensemble prediction (e.g., <xref ref-type="bibr" rid="B45">Houtekamer and Derome, 1995</xref>), where a number of forecasts are performed with the intention of spanning the full range of possible future conditions, given the current state and the uncertainty associated with its estimation. For ensemble prediction, each ensemble member could be considered an analog of the current state, with the ensemble mean representing the most likely state, and anomalies from the ensemble mean used to underpin data assimilation.</p>
<p>In the fields of machine learning and data mining, a widely-used method that is similar to analog forecasting is called k-Nearest Neighbours (kNN; e.g., <xref ref-type="bibr" rid="B34">Fix and Hodges, 1951</xref>; <xref ref-type="bibr" rid="B22">Cover and Hart, 1967</xref>; <xref ref-type="bibr" rid="B26">Deng et&#xa0;al., 2016</xref>; <xref ref-type="bibr" rid="B108">Zhang et&#xa0;al., 2017</xref>). kNN is mostly used as a clustering and classification algorithm that is applied to many different fields, including healthcare (e.g., <xref ref-type="bibr" rid="B106">Xing and Bei, 2019</xref>), finance (e.g., <xref ref-type="bibr" rid="B46">Imandoust et&#xa0;al., 2013</xref>), and facial recognition (e.g., <xref ref-type="bibr" rid="B103">Wang and Li, 2022</xref>). The idea behind kNN is that a given data point can be classified or predicted based on the characteristics of its <italic>k</italic> most similar neighbours in some relevant sub-space, where <italic>k</italic> is an integer (analogous to ensemble size). We extend the analog forecasting framework by incorporating a kNN approach to generate an ensemble of regional SLA forecasts. A similar approach was applied by <xref ref-type="bibr" rid="B31">Eckel and Delle Monache (2016)</xref> for NWP, showing that the hybrid analog ensemble approach outperformed traditional forecast systems at that time.</p>
<p>The key idea is to objectively identify an ensemble of past ocean states that resemble current conditions. The subsequent evolution of these historical analogs provides an ensemble of forecasts. When analogs identified are from an archive of free-running models with no data assimilation, then the assembled forecasts are dynamically consistent. Here, we regard a state as dynamically consistent if it is a solution to the model equations. By maintaining dynamical consistency, initialisation shock is eliminated. Here we show that analog forecasting can produce forecasts with more skill than traditional systems, and can be produced at a fraction of the computational cost.</p>
<p>The data sets used in the study are described in section 2, the methodology is presented in section 3, and the results are in section 4. We include a discussion in section 5, the pseudo-code for our system in section 6, followed by our conclusions in section 7.</p>
</sec>
<sec id="s2">
<label>2</label>
<title>Data</title>
<sec id="s2_1">
<label>2.1</label>
<title>Observations</title>
<p>The observations that underpin the system presented here include along-track satellite altimetry from the Radar Altimeter Database System (RADS, <xref ref-type="bibr" rid="B93">Scharroo et&#xa0;al., 2013</xref>). The along-track data is corrected for various geophysical and instrumental effects (<xref ref-type="bibr" rid="B92">Scharroo, 2018</xref>), including the effects of atmospheric pressure. Additionally, the sea-level observations are converted to SLA by removing an appropriate mean sea surface height. The experiments presented here span 2023, when altimeter data is available from six altimeter missions, including Sentinel-3A, -3B, and -6A, SARAL/AltiKa, Jason-3, and CryoSat-2. The altimeter data analysed in this study have a sampling frequency of 1 Hz, which translates to a spatial resolution of roughly 7 km along-track. The repeat cycle for Sentinel-3A and -3B is 27 days; for Sentinel-6A and Jason-3 is 10 days; and for SARAL/AltiKa is 35 days; while CryoSat-2 has no exact repeat cycle.</p>
</sec>
<sec id="s2_2">
<label>2.2</label>
<title>SLA archive</title>
<p>The gridded SLA fields used as an archive for our system are from many different sources. The archive of states from which analogs are identified is sometimes called a catalogue (e.g., <xref ref-type="bibr" rid="B80">Platzer and Chapron, 2024</xref>) or a library (e.g., <xref ref-type="bibr" rid="B29">Ding et&#xa0;al., 2018</xref>). This includes many different models, namely version 3 and version 4 of the Ocean Forecasting Australia Model (OFAM, <xref ref-type="bibr" rid="B75">Oke et&#xa0;al., 2013</xref>), version 3 of the LASG/IAP Climate System Ocean Model (LICOM3, <xref ref-type="bibr" rid="B28">Ding et&#xa0;al., 2022</xref>), the 0.1<sup>&#x25e6;</sup>-resolution version of the Australian Community Climate and Earth System Simulator Ocean Model (ACCESS-OM2-01, <xref ref-type="bibr" rid="B50">Kiss et&#xa0;al., 2020</xref>), and the Ocean general circulation model For the Earth Simulator (OFES, <xref ref-type="bibr" rid="B63">Masumoto et&#xa0;al., 2004</xref>). Relevant details of the specific model runs are summarised in <xref ref-type="table" rid="T1"><bold>Table&#xa0;1</bold></xref>. All of the models used here are based on either version 3 or 4 of the Modular Ocean Model (MOM, <xref ref-type="bibr" rid="B36">Griffies, 2009</xref>). Model runs are forced with atmospheric fields from JRA55 (<xref ref-type="bibr" rid="B52">Kobayashi et&#xa0;al., 2015</xref>), ERA-Interim (<xref ref-type="bibr" rid="B24">Dee and Uppala, 2009</xref>), ERA-20C (<xref ref-type="bibr" rid="B81">Poli et&#xa0;al., 2016</xref>), NCEP (<xref ref-type="bibr" rid="B48">Kalnay and Kanamitsu, 1996</xref>), or a 17-member ensemble-mean CMIP5-RCP8.5 (e.g., <xref ref-type="bibr" rid="B49">Kharin et&#xa0;al., 2013</xref>). The horizontal resolution for all models is 0.1<sup>&#x25e6;</sup>, although the data from C100 (using LICOM3.0) are only freely available at 0.25<sup>&#x25e6;</sup>-resolution. Importantly, all model runs provide daily-averaged SLA fields. 
Some models report sea-level that includes the impact of atmospheric pressure. For these elements of the archive, an inverse barometer correction has been applied.</p>
<table-wrap id="T1" position="float">
<label>Table&#xa0;1</label>
<caption>
<p>Summary of the model runs used in this study.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="left">Abbrev.</th>
<th valign="middle" align="center">Run type</th>
<th valign="middle" align="center">Model</th>
<th valign="middle" align="center">Config.</th>
<th valign="middle" align="center">Res.</th>
<th valign="middle" align="center">Forcing</th>
<th valign="middle" align="center">Duration</th>
<th valign="middle" align="left">Reference</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="left">EISP JRSP</td>
<td valign="middle" align="center">IAF</td>
<td valign="middle" align="center">MOM4</td>
<td valign="middle" align="center">OFAM</td>
<td valign="middle" align="center">0.1<sup>&#x25e6;</sup></td>
<td valign="middle" align="center">ERA-Interim JRA55</td>
<td valign="middle" align="center">1979-2014 (36 years)<break/>1993-2012 (20 years)</td>
<td valign="middle" align="left"><xref ref-type="bibr" rid="B75">Oke et&#xa0;al. (2013)</xref></td>
</tr>
<tr>
<td valign="middle" align="left">Y79R<break/>CM85</td>
<td valign="middle" align="center">RYF IAF</td>
<td valign="middle" align="center">MOM4</td>
<td valign="middle" align="center">OFAM</td>
<td valign="middle" align="center">0.1<sup>&#x25e6;</sup></td>
<td valign="middle" align="center">JRA55&#x2013;1979 CMIP5</td>
<td valign="middle" align="center">123 years<break/>2006-2101 (96 years)</td>
<td valign="middle" align="left"><xref ref-type="bibr" rid="B109">Zhang et&#xa0;al. (2016)</xref></td>
</tr>
<tr>
<td valign="middle" align="left">BR20<break/>BR23</td>
<td valign="middle" align="center">RA</td>
<td valign="middle" align="center">MOM4<break/>+EnOI</td>
<td valign="middle" align="center">OFAM</td>
<td valign="middle" align="center">0.1<sup>&#x25e6;</sup></td>
<td valign="middle" align="center">JRA55<break/>ERA-Interim</td>
<td valign="middle" align="center">1993-2022 (30 years)<break/>2010-2022 (13 years)</td>
<td valign="middle" align="left"><xref ref-type="bibr" rid="B17">Chamberlain et&#xa0;al. (2021b)</xref></td>
</tr>
<tr>
<td valign="middle" align="left">OCUR SSDU</td>
<td valign="middle" align="center">OA</td>
<td valign="middle" align="center">OI</td>
<td valign="middle" align="center">DM02<break/>vNov2024</td>
<td valign="middle" align="center">0.2<sup>&#x25e6;</sup><break/>0.125<sup>&#x25e6;</sup></td>
<td valign="middle" align="center">n/a<break/>n/a</td>
<td valign="middle" align="center">1993-2020 (28 years)<break/>1993-2022 (30 years)</td>
<td valign="middle" align="left">IMOS <break/>CMEMS</td>
</tr>
<tr>
<td valign="middle" align="left">C100</td>
<td valign="middle" align="center">IAF</td>
<td valign="middle" align="center">MOM3</td>
<td valign="middle" align="center">LICOM3.0</td>
<td valign="middle" align="center">0.25<sup>&#x25e6;</sup></td>
<td valign="middle" align="center">ERA-20C</td>
<td valign="middle" align="center">1901-2010 (110 years)</td>
<td valign="middle" align="left"><xref ref-type="bibr" rid="B28">Ding et&#xa0;al. (2022)</xref></td>
</tr>
<tr>
<td valign="middle" align="left">AOM1<break/>AOM2<break/>AOM3<break/>AOM4</td>
<td valign="middle" align="center">IAF</td>
<td valign="middle" align="center">MOM4</td>
<td valign="middle" align="center">A-OM2-01</td>
<td valign="middle" align="center">0.1<sup>&#x25e6;</sup></td>
<td valign="middle" align="center">JRA55-do</td>
<td valign="middle" align="center">1958-2018 (61 years)</td>
<td valign="middle" align="left"><xref ref-type="bibr" rid="B50">Kiss et&#xa0;al. (2020)</xref></td>
</tr>
<tr>
<td valign="middle" align="left">AOMR</td>
<td valign="middle" align="center">RYF</td>
<td valign="middle" align="center">MOM4</td>
<td valign="middle" align="center">A-OM2-01</td>
<td valign="middle" align="center">0.1<sup>&#x25e6;</sup></td>
<td valign="middle" align="center">JRA55 1990</td>
<td valign="middle" align="center">231 years</td>
<td valign="middle" align="left"><xref ref-type="bibr" rid="B98">Stewart et&#xa0;al. (2020)</xref></td>
</tr>
<tr>
<td valign="middle" align="left">OFSC</td>
<td valign="middle" align="center">CLIM</td>
<td valign="middle" align="center">MOM3</td>
<td valign="middle" align="center">OFES1</td>
<td valign="middle" align="center">0.1<sup>&#x25e6;</sup></td>
<td valign="middle" align="center">NCEP repeat</td>
<td valign="middle" align="center">8 years</td>
<td valign="middle" align="left"><xref ref-type="bibr" rid="B63">Masumoto et&#xa0;al. (2004)</xref></td>
</tr>
<tr>
<td valign="middle" align="left">OFSJ</td>
<td valign="middle" align="center">IAF</td>
<td valign="middle" align="center">MOM3</td>
<td valign="middle" align="center">OFES2</td>
<td valign="middle" align="center">0.1<sup>&#x25e6;</sup></td>
<td valign="middle" align="center">JRA55-do</td>
<td valign="middle" align="center">1990&#x2013;2023 (34 years)</td>
<td valign="middle" align="left"><xref ref-type="bibr" rid="B91">Sasaki et&#xa0;al. (2020)</xref></td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>Run types include Interannual Forcing (IAF) with realistic year-to-year variability; Repeat-Year Forcing (RYF) with a fixed annual cycle from one year; Climatological Forcing (CLIM), with a smoothed seasonal cycle; data-assimilating reanalyses (RA), and Observation-based analyses (OA). The IAF runs using ACCESS-OM2-01 (A-OM2-01) include four cycles (AOM1-4).</p></fn>
</table-wrap-foot>
</table-wrap>
<p>The model runs included in <xref ref-type="table" rid="T1"><bold>Table&#xa0;1</bold></xref> are a mix of standard model integrations, with realistic interannual forcing (IAF) and some are model simulations with repeat year forcing (RYF). Of the RYF runs, Y79R is a 123-year model run with repeat-year forcing from 1979 (<xref ref-type="bibr" rid="B109">Zhang et&#xa0;al., 2016</xref>); AOMR is a 230-year model run with repeat-year forcing from 1990/1991 (<xref ref-type="bibr" rid="B98">Stewart et&#xa0;al., 2020</xref>); and OFSC is an 8-year model run with climatological forcing fields from an NCEP reanalysis (<xref ref-type="bibr" rid="B63">Masumoto et&#xa0;al., 2004</xref>). The runs with ACCESS-OM2-01 (AOM1, AOM2, AOM3, and AOM4) are IAF runs, but include four cycles, each spanning 61 years, with forcing from JRA-55 (<xref ref-type="bibr" rid="B50">Kiss et&#xa0;al., 2020</xref>).</p>
<p>In addition to data from model runs, for some experiments, we also use data from ocean reanalysis (RA) and ocean analysis (OA) products. The RA data sets include two versions of the Bluelink ReANalysis (BRAN) - version 2020 (BR20; <xref ref-type="bibr" rid="B17">Chamberlain et&#xa0;al., 2021b</xref>, <xref ref-type="bibr" rid="B16">a</xref>) and version 2023 (BR23; which includes incremental improvements compared to BRAN2020). The OA products are both global gridded estimates of SLA, produced using optimal interpolation. These include IMOS OceanCurrent (OCUR; <ext-link ext-link-type="uri" xlink:href="http://oceancurrent.imos.org.au">http://oceancurrent.imos.org.au</ext-link>) and Ssalto/DUACS (SSDU), produced under Copernicus Marine Environment Monitoring Service (CMEMS; <ext-link ext-link-type="uri" xlink:href="https://marine.copernicus.eu">https://marine.copernicus.eu</ext-link>). OceanCurrent is a 0.2<sup>&#x25e6;</sup>-resolution product, and Ssalto/DUACS is a 0.125<sup>&#x25e6;</sup>-resolution product. The RA and OA products all span 2023 - which is the test period for this study. When these products are part of the archive, their gridded fields after September 2022 are excluded from the archive to ensure a &#x201c;fair&#x201d; assessment of the analog forecasts.</p>
<p>For this study, we assemble a global archive of daily SLA fields. This permits efficient application to any region of the world. However, to assess the system, we produce forecasts of SLA for 12 regional domains around Australia (<xref ref-type="fig" rid="f1"><bold>Figure&#xa0;1</bold></xref>). Each domain spans 5x5<sup>&#x25e6;</sup> &#x2013; approximately 500x500 km at 30<sup>&#x25e6;</sup>S &#x2013; and includes a range of dynamic regimes, including western and eastern boundary currents, eddy-rich fields, and wind-driven regions in both tropical and mid-latitude zones.</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>Map of the domains around Australia and New Zealand that are used to test analog forecasts.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-12-1729116-g001.tif">
<alt-text content-type="machine-generated">Map of the Southwest Pacific and surrounding regions showing numbered boxes indicating specific locations. The locations include EAC, Lord Howe Island, EAC Eddy, Tasmania, Coral Sea, New Caledonia, Bay of Plenty, Lombok, Christmas Island, Ningaloo, Perth, and GAB. Each box corresponds to these names as listed in the legend. Latitude and longitude lines provide geographical reference.</alt-text>
</graphic></fig>
<p>The most computationally intensive step in our system is reading the archived data into memory. This is made more efficient by &#x201c;cutting out&#x201d; regional subsets of each model in advance for each domain.</p>
</sec>
<sec id="s2_3">
<label>2.3</label>
<title>Analysis of the model archive</title>
<p>As noted in the introduction, most NWP centres have abandoned analog forecasting, citing the difficulty of finding &#x201c;good analogs&#x201d;. Here, we use data from many different sources, hoping to expand the catalogue of states from which analogs can be identified. The full aggregated archive of states is assembled from 16 different model runs or analysis products (<xref ref-type="table" rid="T1"><bold>Table&#xa0;1</bold></xref>) from over 1000 years of data. To evaluate how data from additional sources contribute independent information to the archive, we perform a singular value decomposition (SVD) on various subsets of the archived fields. We analyse data from Region 1, which we assume to be representative of other regions. We perform the SVD for each model run or analysis product individually; and we also calculate the SVD for aggregated archives, starting with a single model run (m=1) and progressively including data from additional model runs and analysis products, up to m=16.</p>
<p>Since the square of each singular value of a data matrix is proportional to the variance explained by its corresponding mode, the singular value spectrum shows how the effective dimension of the state space changes with the addition of each new source of SLA data. To prevent artificial inflation of the variance due to increasing sample size, we normalise each data matrix by <inline-formula>
<mml:math display="inline" id="im1"><mml:mrow><mml:mn>1</mml:mn><mml:mo stretchy="false">/</mml:mo><mml:msqrt><mml:mi>n</mml:mi></mml:msqrt></mml:mrow></mml:math></inline-formula>, where <italic>n</italic> is the number of daily fields in the archive. This normalisation ensures that increases in singular values truly reflect new patterns of variability, not simply more data. When a new dataset contributes no independent information, its addition doesn&#x2019;t change the singular values; and the data from the new source merely projects onto existing modes. By contrast, an increase in singular values indicates an increase in the effective dimension of the subspace spanned by the archive.</p>
<p>Results are presented in <xref ref-type="fig" rid="f2"><bold>Figure&#xa0;2</bold></xref>, showing the spectra of singular values for: (a) all OFAM runs, (b) both ocean analyses, (c) all ACCESS-OM2&#x2013;01 runs, and (d) all model runs and analyses listed in <xref ref-type="table" rid="T1"><bold>Table&#xa0;1</bold></xref>. In <xref ref-type="fig" rid="f2"><bold>Figure&#xa0;2a</bold></xref>, although six OFAM runs are included, they fall into three distinct groups with independent variability: the ERA-Interim&#x2013;forced run (EISP), the JRA-55&#x2013;forced runs (JRSP, Y79R), and the reanalyses (BR20, BR23). We find that CM85 adds no new dimensions on top of EISP, JRSP, and Y79R. We also see that both reanalyses (BR20 and BR23) project onto equivalent modes, together increasing the overall dimension of the archived dataset.</p>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>Spectrum of singular values, plotted on a log-scale, using aggregated data from 1 up to 16 model runs (for region 1), for <bold>(a)</bold> OFAM-based runs, <bold>(b)</bold> observation-based analyses, <bold>(c)</bold> ACCESS-OM2&#x2013;01 based runs, and <bold>(d)</bold> all runs/analyses.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-12-1729116-g002.tif">
<alt-text content-type="machine-generated">Four line charts display singular values against modes across different panels: (a) OFAM, (b) OA, (c) AOM*, and (d) ALL. Each chart includes multiple colored lines representing various datasets, identified by legends indicating years and labels, such as EISP, JRSP, Y79R, and others. The x-axis shows the mode from zero to one thousand, and the y-axis is logarithmic from one to ten to the power of negative three.</alt-text>
</graphic></fig>
<p>The two observation-based ocean analyses (OCUR and SSDU; <xref ref-type="fig" rid="f2"><bold>Figure&#xa0;2b</bold></xref>) contribute distinct modes, likely due to differences in gridding methods and spatial resolution. All of the ACCESS-OM2&#x2013;01 runs (<xref ref-type="fig" rid="f2"><bold>Figure&#xa0;2c</bold></xref>) project onto the same subspace; and data from the OFES model introduces new, independent variability (<xref ref-type="fig" rid="f2"><bold>Figure&#xa0;2d</bold></xref>), despite the shorter duration of those runs. We find that the C100 dataset, generated using LICOM3.0, also contributes unique modes, expanding the effective dimension of the archive.</p>
<p>Based on analysis of singular values (<xref ref-type="fig" rid="f2"><bold>Figure&#xa0;2</bold></xref>), we conclude that multiple runs from the same model configuration generally span the same subspace. Consequently, adding more runs from the same configuration does not increase the effective dimensionality of the archive. To further explore the contribution of information to the aggregated dataset, we also examine the associated singular vectors.</p>
<p>We find that the right singular vectors, representing the dominant spatial modes, are effectively equivalent across all runs from the same model configuration (though the exact order of modes and the details are not precisely the same). This confirms that these runs share the same underlying spatial structures - consistent with the analysis of singular values. By contrast, the left singular vectors, representing the temporal variability, are uncorrelated across different runs - even for the repeat cycles of AOM* that span the same time periods and are forced with the same fluxes. This indicates that while each run projects onto the same set of spatial modes, the combination and weighting of those modes vary in time for different runs.</p>
<p>The implication of this result is important: although the spatial subspace is unchanged, each new run contributes a unique combination of modes. As a result, the full set of archived fields becomes richer in its diversity of states. For analog forecasting, this means that adding more runs - even from the same model - broadens the catalogue of historical states that can be searched for analogs, increasing the likelihood of identifying a close match to the observed state.</p>
<p>This finding is consistent with a well-known property of high-dimensional spaces - that independently drawn random vectors from a high-dimensional state are likely to be nearly orthogonal (<xref ref-type="bibr" rid="B19">Christiansen, 2018</xref>). It is also supported by our sensitivity experiments that show that forecast skill consistently improves as more runs are included in the archive.</p>
</sec>
<sec id="s2_4">
<label>2.4</label>
<title>Benchmark dataset</title>
<p>To benchmark the skill of our analog forecasting system, we compare its predictions against archived forecasts from OceanMAPS version 4.0i (OMv4.0i; <xref ref-type="bibr" rid="B12">Brassington et&#xa0;al., 2023</xref>), accessed as they were available at the time of each forecast (last retrieved 14 February 2025). OMv4.0i is a traditional ocean forecast system that uses a hybrid-EnKF data assimilation system to initialise a near-global ocean general circulation model (OFAM). OMv4.0i uses a 48-member dynamic ensemble and a 144-member stationary ensemble, similar to <xref ref-type="bibr" rid="B21">Counillon et&#xa0;al. (2009)</xref>. This approach to data assimilation combines the Ensemble Kalman Filter (<xref ref-type="bibr" rid="B32">Evensen, 2003</xref>) and Ensemble Optimal Interpolation (<xref ref-type="bibr" rid="B71">Oke et&#xa0;al., 2002b</xref>; <xref ref-type="bibr" rid="B32">Evensen, 2003</xref>; <xref ref-type="bibr" rid="B73">Oke et&#xa0;al., 2010</xref>) for estimating the system&#x2019;s background error covariance. OMv4.0i produces forecasts that are of comparable performance to other operational systems run around the world (e.g., <xref ref-type="bibr" rid="B3">Aijaz et&#xa0;al., 2023</xref>) and are significantly better than version 3 of the same system that preceded it (<xref ref-type="bibr" rid="B12">Brassington et&#xa0;al., 2023</xref>).</p>
</sec>
<sec id="s2_5">
<label>2.5</label>
<title>Validation dataset</title>
<p>To independently assess each forecast produced here, we compare forecast SLA fields to verifying analyses from IMOS OceanCurrent (<ext-link ext-link-type="uri" xlink:href="http://oceancurrent.imos.org.au">http://oceancurrent.imos.org.au</ext-link>, last accessed on 14 February 2025). SLA analyses from OceanCurrent are available on a 0.2&#xb0;-resolution grid, with analyses every day. OceanCurrent analyses are produced by merging along-track SLA from all available satellite altimeter missions together with SLA observations from coastal tide gauges around Australia using optimal interpolation.</p>
</sec>
</sec>
<sec id="s3">
<label>3</label>
<title>Method</title>
<p>Here, we develop a simple analog forecast system to predict SLA for a regional domain to quantify the mesoscale ocean circulation. The inputs required for this approach include an estimate of the current state of the ocean, and an archive of past or simulated ocean states. The system identifies the instance in the archive that is most similar to the current state. This instance is considered an &#x201c;analog&#x201d;, and the sequence of archived fields immediately following the identified analog is assembled as a forecast.</p>
<p>With some exceptions (e.g., <xref ref-type="bibr" rid="B25">Delle Monache et&#xa0;al., 2013</xref>; <xref ref-type="bibr" rid="B47">Junk et&#xa0;al., 2015</xref>), most analog forecasting systems identify a single forecast. Here, we extend this approach by identifying an ensemble of analogs, each representing a possible evolution of the ocean. We analyse the forecasts from each individual analog, as well as their ensemble mean. This is conceptually similar to kNN (e.g., <xref ref-type="bibr" rid="B34">Fix and Hodges, 1951</xref>; <xref ref-type="bibr" rid="B22">Cover and Hart, 1967</xref>), which often involves weighted ensemble averaging (e.g., <xref ref-type="bibr" rid="B37">Gul et&#xa0;al., 2022</xref>). Several other studies have used analog forecasting with a modified kNN approach to produce tailored weather forecasts (e.g., <xref ref-type="bibr" rid="B9">Bannayan and Hoogenboom, 2008</xref>; <xref ref-type="bibr" rid="B38">Hall et&#xa0;al., 2010</xref>; <xref ref-type="bibr" rid="B105">Xie et&#xa0;al., 2024</xref>). For the remainder of this study, we refer to each analog (ensemble member) as a nearest neighbour (NN).</p>
<p>Each NN is identified using an objective similarity metric between the observed ocean state and archived fields. Common metrics include anomaly cross-correlation (ACC) and mean absolute difference (MAD). For the application presented here we prefer using ACC as the metric for calculating similarity and have used this as the default for calculations presented in this study. The archive of past states may be sourced from a single long model run (e.g., <xref ref-type="bibr" rid="B50">Kiss et&#xa0;al., 2020</xref>), a reanalysis (e.g., <xref ref-type="bibr" rid="B17">Chamberlain et&#xa0;al., 2021b</xref>), or observation-based analyses (e.g., <xref ref-type="bibr" rid="B6">Ballarotta et&#xa0;al., 2025</xref>). Many analog forecasting studies use data from a single reanalysis or model run. However, to ensure dynamically consistent forecasts, most of the results presented in this study only use fields from free-running model simulations without data assimilation (a subset of runs listed in <xref ref-type="table" rid="T1"><bold>Table&#xa0;1</bold></xref> - only those with run types of IAF, RYF, or CLIM; referred to below as Experiment 1).</p>
<p>The present ocean state is defined using satellite altimetry-derived SLA observations, which effectively capture the boundary currents and mesoscale features, such as eddies and fronts. For most experiments reported here, we use SLA data over a 10-day period, instead of just a single-day of observations. We compare the most recent 10-day evolution of SLA, relative to the analysis time (t=0), to archived sequences of the same length. This allows the system to identify analogs that best match the recent temporal variability of the mesoscale ocean, an approach that is similar to Local Dynamic Analog forecasting in NWP (<xref ref-type="bibr" rid="B44">Hou et&#xa0;al., 2021</xref>).</p>
<p><xref ref-type="fig" rid="f3"><bold>Figure&#xa0;3</bold></xref> illustrates this approach. The top row shows along-track SLA observations over a 10-day period. The second row presents an archive of SLA fields from a model run. The lower rows display model fields interpolated to the observation locations (using bi-linear interpolation) for each 10-day period in the archive. The MAD is computed for each sample, and the sequence with the smallest MAD is selected as the NN (i.e., the best analog). The forecast SLA is then assembled from the model fields immediately following the NN period. While <xref ref-type="fig" rid="f3"><bold>Figure&#xa0;3</bold></xref> uses MAD for NN identification, ACC can also be used, and in most cases, both metrics yield similar results.</p>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>Illustration of how the analog forecast system quantifies the mean absolute difference (MAD) between a 10-day sequence of along-track altimeter observations (OBS, top row) and every 10-day sequence in the training dataset (Train, second row). The number in each panel of the Train row indicates the corresponding day in the training dataset. In the OBS row, each dot represents an observation location, with its colour indicating the observed SLA, ranging from -0.5 m (red) to 0.5 m (blue), with white representing zero. In the Test1, Test2, etc., rows, the colour of each dot represents the SLA value at the observation locations from the corresponding sequence in the training dataset. For clarity, fields for Test8&#x2013;Test16 are not shown. This demonstration uses a simplified training dataset of only 30 days, whereas the experiments presented in this study utilise a much larger dataset spanning over 1000 years of daily SLA fields. The NN is identified as the 10-day sequence in the training dataset with the smallest MAD. In this example, for a 5&#xb0; &#xd7; 5&#xb0; region off south-eastern Australia, the NN corresponds to Test5, with an MAD of 0.06655 m. This sequence consists of SLA fields from days 5 to 14 in the training dataset. The associated 15-day SLA &#x201c;forecast&#x201d; is then derived from the SLA fields immediately following day 14 (i.e., days 15&#x2013;29 in the training dataset).</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-12-1729116-g003.tif">
<alt-text content-type="machine-generated">A series of stacked line graphs compare observations, training, and various test results labeled Test1 through Test21. Each graph includes multiple colored lines, with Mean Absolute Difference (MAD) values indicated next to each test result, ranging from 0.06655 meters to 0.12713 meters. The graphs visually depict different scenarios or iterations, highlighting variance across tests.</alt-text>
</graphic></fig>
<p><xref ref-type="fig" rid="f4"><bold>Figure&#xa0;4</bold></xref> provides a more detailed example of how analog forecasting is used to assemble a forecast of SLA after the NN is identified. Again, the top row of <xref ref-type="fig" rid="f4"><bold>Figure&#xa0;4</bold></xref> shows observations over a 10-day period. The second row shows the SLA fields for the first NN. The third row presents model fields interpolated to observation locations &#x2013; intended to demonstrate the consistency between the observed and archived SLA. The bottom row of <xref ref-type="fig" rid="f4"><bold>Figure&#xa0;4</bold></xref> displays a forecast for SLA that follows the last day of the NN period.</p>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>Demonstration of how a selected NN is used to produce a forecast. The top row (a1-j1) shows along-track altimeter data that is used to assess each potential neighbour, where the location of each dot denotes the location of an observation, and the colour of each dot indicates the value of the SLA observation. The second row (a2-j2) shows SLA from the archive for the first NN for the 10-day time-window that is identified to &#x201c;fit&#x201d; the observations most closely (for this example, the MAD of the NN is 0.0617 m and the ACC is 0.83). The third row (a3-j3) shows the modelled SLA fields interpolated to the observation locations (in time and space) &#x2013; to qualitatively demonstrate the level of agreement with the observations. The bottom row (a4-j4) shows SLA for 10 days after the selected period for the first NN &#x2013; interpreted here as a 10-day forecast. This example is for a domain off south-eastern Australia, showing SLA with a range of -0.5 (blue) to 0.5 m (red), where zero is white.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-12-1729116-g004.tif">
<alt-text content-type="machine-generated">Panels illustrate data comparisons across different rows and timeframes with color gradients representing intensity. Observed data ("OBS") are at the top, followed by the archived fields of the first nearest neighbour ("NN1 (train)"), those fields interpolated to the observation locations ("NN1 (interp)"), and the resulting forecast ("NN1 (predict)"). Each row contrasts changes over time from t=&#x2212;9 to t=+10.</alt-text>
</graphic></fig>
<p>In our experiments, we use an extensive archive of up to 365,502 daily SLA fields, compiled from up to 16 different sources spanning over 1000 years (<xref ref-type="table" rid="T1"><bold>Table&#xa0;1</bold></xref>). To ensure independence of each NN (each ensemble member), we apply the following selection process. First, we identify the &#x201c;best&#x201d; NN (NN1) - the NN with the highest ACC compared to along-track SLA. Second, we exclude all archived states within 45 days before and after NN1. Third, we identify the next best NN (NN2) and repeat until 12 NNs are selected (the choice of 12 is justified below). We&#x2019;re also careful to exclude NN periods at the end of each model run, to avoid assembling a forecast that spans two different model runs. This process allows us to efficiently construct ensemble-based forecasts that are dynamically consistent and free from initialisation shock.</p>
<p>To evaluate the significance of the identified NNs - that is, whether the identified NNs are meaningfully distinguishable from other fields in the archive - we analyse a frequency histogram of the MAD for each 10-day period within a single forecast across six domains (<xref ref-type="fig" rid="f5"><bold>Figure&#xa0;5</bold></xref>). For some domains, the histogram resembles a Gaussian distribution, while others show a skewed Gaussian shape. Some domains, such as Regions 1 and 5, have quite a long tail, suggesting that the identified NNs are truly distinct from other fields in the archive; while others, such as Regions 3 and 9, have a short tail for small values of MAD, suggesting that the NNs are not particularly distinct from many other samples in the archive.</p>
<fig id="f5" position="float">
<label>Figure&#xa0;5</label>
<caption>
<p>Frequency histograms of MAD for each 10-day sample tested by the kNN algorithm for an example forecast in six different domains, labelled in each panel <bold>(a-f)</bold>. The NNs correspond to samples with the smallest MAD. Panel <bold>(a)</bold> shows the example represented in <xref ref-type="fig" rid="f4"><bold>Figure&#xa0;4</bold></xref>. A larger tail implies more distinct NNs, compared to a random sample.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-12-1729116-g005.tif">
<alt-text content-type="machine-generated">Six histograms display the frequency distribution of Mean Absolute Difference (MAD) in meters for different regions: (a) Region 1, (b) Region 3, (c) Region 5, (d) Region 7, (e) Region 9, and (f) Region 11. Each histogram varies in skewness and spread, illustrating distinct characteristics of MAD across these regions.</alt-text>
</graphic></fig>
</sec>
<sec id="s4" sec-type="results">
<label>4</label>
<title>Results</title>
<sec id="s4_1">
<label>4.1</label>
<title>Experiment design</title>
<p>To evaluate our system, we conduct 25 independent 15-day forecasts, initialised every 15 days throughout 2023. These forecasts span 12 regional domains around Australia (<xref ref-type="fig" rid="f1"><bold>Figure&#xa0;1</bold></xref>), encompassing a range of dynamic regimes. Most results presented here are from Experiment 1 (Exp. 1), which uses sea level anomaly (SLA) fields from the free-running models listed in <xref ref-type="table" rid="T1"><bold>Table&#xa0;1</bold></xref> - EISP, JRSP, Y79R, CM85, C100, AOM*, and OFS* - comprising a total of 902 years of daily SLA data.</p>
</sec>
<sec id="s4_2">
<label>4.2</label>
<title>Statistical assessment</title>
<p><xref ref-type="fig" rid="f6"><bold>Figures&#xa0;6</bold></xref>, <xref ref-type="fig" rid="f7"><bold>7</bold></xref> summarise the system performance across all domains. <xref ref-type="fig" rid="f6"><bold>Figure&#xa0;6</bold></xref> compares MAD between SLA in the verifying analysis and forecasts from three sources, including the kNN-based equal-weighted ensemble mean (kNN EqW); OceanMAPS version 4.0i (OMv4.0i); and the first nearest neighbour (NN1). <xref ref-type="fig" rid="f7"><bold>Figure&#xa0;7</bold></xref> shows an equivalent analysis, but using ACC to evaluate forecasts.</p>
<fig id="f6" position="float">
<label>Figure&#xa0;6</label>
<caption>
<p>Plots showing the MAD between a verifying SLA analysis (from OceanCurrent) and predicted SLA from the ensemble mean of 12 NNs (kNN EqW, blue), OceanMAPSv4 (OMv4.0i, red), and the first NN (NN1, orange) for 12 different regions (smaller MAD is better), labelled in each panel <bold>(a-l)</bold>. Each panel shows the average MAD as a function of lead time, averaged over 25 independent forecasts starting 15 days apart during 2023. Shaded areas denote the standard error of the mean metrics. Each panel also shows the p-value for the comparison between the forecast from either kNN EqW or NN1 (whichever is smaller) and OMv4.0i (averaged over days 1-6) and the next smallest. A p-value below 0.05 indicates that such a difference would occur by chance less than 5% of the time under the null hypothesis of equal performance. The location of each domain is indicated by the region number, referenced to the map at the top left and in <xref ref-type="fig" rid="f1"><bold>Figure&#xa0;1</bold></xref>. Boxes with p-values below 0.05 are coloured according to the forecast system that exhibited statistically significant superior performance, while grey boxes indicate domains where the mean metrics are statistically equivalent. Overall, the kNN forecasts (either kNN EqW or NN1) produced significantly smaller MAD for 5 of 12 domains, whereas OMv4.0i gave the best forecasts for 3 of 12 domains.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-12-1729116-g006.tif">
<alt-text content-type="machine-generated">Line graphs showing Mean Absolute Difference (MAD) in meters across twelve regions in Australia, with lead times from 0 to 15 days. Three methods&#x2014;kNN EqW (blue), OMv4.0i (red), and NN1 (yellow)&#x2014;are compared. Each graph includes a p-value indicating statistical significance. Regions are labeled a-l, with diverse trends observed in MAD over time.</alt-text>
</graphic></fig>
<fig id="f7" position="float">
<label>Figure&#xa0;7</label>
<caption>
<p><bold>(a-l)</bold> As for <xref ref-type="fig" rid="f6"><bold>Figure&#xa0;6</bold></xref>, but showing ACC between a verifying SLA analysis and predicted SLA (larger values indicate better performance). Overall, kNN forecasts (either kNN EqW or NN1) yielded higher ACC in 7 of 12 domains; OMv4.0i was clearly best in 1 domain; and the mean ACC wasn&#x2019;t statistically different for 4 domains, with a high chance that the differences could occur by chance.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-12-1729116-g007.tif">
<alt-text content-type="machine-generated">Map and graphs showing prediction accuracy across 12 Australian regions. Each graph compares three forecasting models: kNN EqW (blue), OMv4.0i (red), and NN1 (yellow), with ACC plotted against lead time in days. Statistical significance is indicated by p-values for each region.</alt-text>
</graphic></fig>
<p>For <xref ref-type="fig" rid="f6"><bold>Figures&#xa0;6</bold></xref>, <xref ref-type="fig" rid="f7"><bold>7</bold></xref>, we show the mean metrics computed from 25 forecasts. The shaded bands represent the standard error of the mean across those forecasts, and the associated p-values are also reported in each panel. To identify the &#x201c;best&#x201d; forecast performance for each region, we compare the metrics (averaged over forecast days 1-6 - limited to 6-day forecasts because that is available from OMv4.0i) between three forecast types: kNN EqW, OMv4.0i, and NN1.</p>
<p>For each pairwise comparison, the null hypothesis is that the two forecast methods have equal mean performance. We evaluate this hypothesis using a standard two-sample t-test (e.g., <xref ref-type="bibr" rid="B13">Browne, 2010</xref>) applied to the distribution of metrics across the 25 forecasts. A p-value (e.g., <xref ref-type="bibr" rid="B101">Vidgen and Yasseri, 2016</xref>) below 0.05 indicates that the observed difference in mean metrics would occur by chance less than 5% of the time under the null hypothesis. When the p-value is below this threshold, we regard the difference between forecast methods as statistically significant.</p>
<p>For regions where one forecast type significantly outperforms the benchmark &#x2013; or where the benchmark significantly outperforms the kNN-based forecasts &#x2013; we denote the region with a coloured box in <xref ref-type="fig" rid="f6"><bold>Figures&#xa0;6</bold></xref>, <xref ref-type="fig" rid="f7"><bold>7</bold></xref>.</p>
<p>Using MAD as a metric, kNN EqW outperforms OMv4.0i in 4 of 12 domains, NN1 outperforms OMv4.0i in 1 of 12 domains, and OMv4.0i outperforms the kNN-based forecasts for 3 of 12 domains (<xref ref-type="fig" rid="f6"><bold>Figure&#xa0;6</bold></xref>). For 3 of 12 domains, the mean MAD are not significantly different.</p>
<p>Using ACC, kNN EqW outperforms OMv4.0i in 6 of 12 domains; NN1 outperforms OMv4.0i in 1 of 12 domains, and OMv4.0i outperforms the kNN-based forecasts in 1 of 12 domains (<xref ref-type="fig" rid="f7"><bold>Figure&#xa0;7</bold></xref>). For 4 of 12 domains, the mean ACC are not significantly different.</p>
<p>Based on these results, we conclude that the kNN/analog system outperforms traditional operational forecasts in 40-60% of cases, performs equally well (no statistical difference) in about 30% of cases, and is outperformed in about 10-25% of cases.</p>
<p>A distinct feature of OMv4.0i forecasts is a sharp increase in MAD and drop in ACC between days 0 and 1 (<xref ref-type="fig" rid="f6"><bold>Figures&#xa0;6</bold></xref>, <xref ref-type="fig" rid="f7"><bold>7</bold></xref>). We attribute this to initialisation issues that are caused by the dynamically inconsistent initial conditions, as noted in the introduction. By contrast, analog forecasts avoid such degradation since each forecast is from a free-running model, and is therefore dynamically consistent.</p>
<p>It is interesting to note the relative number of NNs that are identified from each source in the assembled archive (<xref ref-type="table" rid="T2"><bold>Table&#xa0;2</bold></xref>). In total, we identify 3600 NNs for this study, comprised of an ensemble of 12 for 25 forecasts over 12 domains. We report results from two configurations: Exp. 1, where only dynamically consistent SLA fields are used (from EISP, JRSP, Y79R, CM85, C100, AOM*, and OFS*); and Exp. 17, using all data in the archive (the same as Exp. 1, plus BR20, BR23, OCUR, and SSDU). For Exp. 1, we find that there is a disproportionally high number of NNs from AOM* IAF runs &#x2013; accounting for 38.1% of NNs in Exp. 1, having contributed 30.3% of the archive. For Exp. 17, when we include ocean reanalyses and observation-based analyses in the archive, this weighting towards the AOM* IAF runs reduces, and the observation-based analyses contribute a disproportionally large percentage of NNs. Together, OCUR and SSDU account for 11.5% of NNs, having only comprised 5.9% of the archive; and fields from the BRAN experiments account for 7.4% of NNs, having contributed only 4.4% to the archive.</p>
<table-wrap id="T2" position="float">
<label>Table&#xa0;2</label>
<caption>
<p>Percentage of NNs identified from each model/source, along with the percentage of the total model archive that is from each source.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="bottom" rowspan="2" align="left">Source</th>
<th valign="bottom" rowspan="2" align="left">Runs</th>
<th valign="middle" colspan="2" align="center">Exp. 1</th>
<th valign="middle" colspan="2" align="center">Exp. 17</th>
</tr>
<tr>
<th valign="middle" align="center">%NNs</th>
<th valign="middle" align="center">%Archive</th>
<th valign="middle" align="center">%NNs</th>
<th valign="middle" align="center">%Archive</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="left">OFAM IAF</td>
<td valign="middle" align="left">EISP+JRSP</td>
<td valign="middle" align="center"><bold>8.6%</bold></td>
<td valign="middle" align="center">6.9%</td>
<td valign="middle" align="center">5.6%</td>
<td valign="middle" align="center">5.6%</td>
</tr>
<tr>
<td valign="middle" align="left">OFAM RA</td>
<td valign="middle" align="left">BR20+BR23</td>
<td valign="middle" align="center">0.0%</td>
<td valign="middle" align="center">0.0%</td>
<td valign="middle" align="center"><bold>7.4%</bold></td>
<td valign="middle" align="center">4.4%</td>
</tr>
<tr>
<td valign="middle" align="left">OA</td>
<td valign="middle" align="left">OCUR+SSDU</td>
<td valign="middle" align="center">0.0%</td>
<td valign="middle" align="center">0.0%</td>
<td valign="middle" align="center"><bold>11.5%</bold></td>
<td valign="middle" align="center">5.9%</td>
</tr>
<tr>
<td valign="middle" align="left">OFAM RYF</td>
<td valign="middle" align="left">CM85+Y79R</td>
<td valign="middle" align="center">10.0%</td>
<td valign="middle" align="center">15.3%</td>
<td valign="middle" align="center">17.3%</td>
<td valign="middle" align="center">21.8%</td>
</tr>
<tr>
<td valign="middle" align="left">LICOM IAF</td>
<td valign="middle" align="left">C100</td>
<td valign="middle" align="center">11.3%</td>
<td valign="middle" align="center">13.6%</td>
<td valign="middle" align="center">8.0%</td>
<td valign="middle" align="center">10.8%</td>
</tr>
<tr>
<td valign="middle" align="left">ACCESS-OM2&#x2013;01 IAF</td>
<td valign="middle" align="left">AOM1-4</td>
<td valign="middle" align="center"><bold>38.1%</bold></td>
<td valign="middle" align="center">30.3%</td>
<td valign="middle" align="center"><bold>27.3%</bold></td>
<td valign="middle" align="center">24.3%</td>
</tr>
<tr>
<td valign="middle" align="left">ACCESS-OM2&#x2013;01 RYF</td>
<td valign="middle" align="left">AOMR</td>
<td valign="middle" align="center">26.6%</td>
<td valign="middle" align="center">28.7%</td>
<td valign="middle" align="center">19.4%</td>
<td valign="middle" align="center">23.0%</td>
</tr>
<tr>
<td valign="middle" align="left">OFES1 CLIM</td>
<td valign="middle" align="left">OFSC</td>
<td valign="middle" align="center">0.5%</td>
<td valign="middle" align="center">1.0%</td>
<td valign="middle" align="center">0.4%</td>
<td valign="middle" align="center">0.8%</td>
</tr>
<tr>
<td valign="middle" align="left">OFES2 RYF</td>
<td valign="middle" align="left">OFSR</td>
<td valign="middle" align="center"><bold>4.9%</bold></td>
<td valign="middle" align="center">4.2%</td>
<td valign="middle" align="center">3.1%</td>
<td valign="middle" align="center">3.4%</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>Results are shown for two experiments: Exp. 1 includes archived SLA fields from EISP, JRSP, CM85, Y79R, C100, AOM*, OFSC, and OFSR; and Exp. 17 includes the same fields as Exp. 1, plus BR20, BR23, OCUR, and SSDU. The percentages in bold are when the percentage of NNs exceeds the percentage of fields in the archive.</p></fn>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="s4_3">
<label>4.3</label>
<title>Ensemble forecasts</title>
<p>To examine the mean characteristics of the ensemble forecasts, we present mean rank histograms (<xref ref-type="bibr" rid="B39">Hamill, 2001</xref>) for each region &#x2013; averaged over forecast days 0&#x2013;15 for 25 forecasts &#x2013; in <xref ref-type="fig" rid="f8"><bold>Figure&#xa0;8</bold></xref>. The histograms reveal clear and spatially systematic differences in ensemble performance across the 12 regions. Several regions exhibit a pronounced U-shape (e.g., regions 3, 4, 8, and 9), indicating that the ensemble spread is generally under-dispersive and that observations frequently fall outside the ensemble range (e.g., <xref ref-type="bibr" rid="B39">Hamill, 2001</xref>). Region 2 displays a dome-shaped distribution, suggesting an over-dispersive ensemble. Other regions &#x2013; particularly regions 6, 7, and 10 &#x2013; show flatter, more uniform histograms that imply a more appropriate spread. Regions with strong skewness towards the lowest or highest ranks (e.g., regions 3, 4, 8, and 12) indicate localised biases in the ensemble mean.</p>
<fig id="f8" position="float">
<label>Figure&#xa0;8</label>
<caption>
<p>Mean rank histograms, averaged over day 0&#x2013;15 of 25 forecasts for each region, labelled in each panel <bold>(a-l)</bold>.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-12-1729116-g008.tif">
<alt-text content-type="machine-generated">Twelve bar graphs depict the rank probabilities for different regions across a map of Australia. Each graph shows the probability distribution (P(rank)) for ranks one to thirteen. The graphs illustrate varied distributions, with some showing a uniform spread, while others are skewed or have peaks at certain ranks. Each graph corresponds to a specific region labeled from one to twelve on the map above the graphs.</alt-text>
</graphic></fig>
<p>Overall, the rank histograms indicate that the analog-based ensembles capture important aspects of forecast uncertainty, although the spread is insufficient in a number of regions and occasionally exhibits systematic skewness. These deficiencies likely reflect limitations in the diversity or representativeness of the analog archive, rather than issues associated with ensemble data assimilation. The poorest-performing regions (3, 4, 8, 9, and 12) show clear U-shaped histograms, consistent with under-dispersion. In three of these regions (3, 4, and 9), the analog ensemble usually underperforms relative to OMv4.0i (<xref ref-type="fig" rid="f6"><bold>Figures&#xa0;6</bold></xref>, <xref ref-type="fig" rid="f7"><bold>7</bold></xref>). This suggests that kNN performance could be improved by expanding or diversifying the archive so that the selected states span a broader range of independent dynamical conditions.</p>
<p>To further illustrate forecast performance and practical application, we present a number of detailed examples (<xref ref-type="fig" rid="f9"><bold>Figures&#xa0;9</bold></xref>&#x2013;<xref ref-type="fig" rid="f13"><bold>13</bold></xref>). Each example shows the verifying analyses, equal-weighted NN ensemble means, and forecasts from 12 individual NNs at t+0, t+5, t+10, and t+15. Results described in this section are from Exp. 1, using only SLA fields from free-running models. The examples discussed below include a mix of cases when the analog forecast system performs well, and some where it performs poorly. To further demonstrate the performance, we also offer results from 35 other examples (2 or 3 for each region) in the <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material</bold></xref>.</p>
<fig id="f9" position="float">
<label>Figure&#xa0;9</label>
<caption>
<p>Example 1: Analog forecasts for the EAC domain (Region 1, <xref ref-type="fig" rid="f1"><bold>Figure&#xa0;1</bold></xref>) for a forecast starting on 2 January 2023, showing Ocean Current analyses <bold>(a-d)</bold>, the equal-weighted NN ensemble mean (a0-d0), and the 12 NNs (a1-d1 &#x2013; a12-d12). The source (model and model run) for each NN is indicated to the left of each sequence of NN fields, along with the month and year of each NN. SLA fields are shown at (column a) t+0, (column b) <italic>t</italic> + 5<italic>d</italic>, (column c) <italic>t</italic> + 10<italic>d</italic>, and (column d) <italic>t</italic> + 15<italic>d</italic>. The ACC for the ensemble mean (black) and each NN (coloured) are shown, as a function of lead time, in panel <bold>(e)</bold>.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-12-1729116-g009.tif">
<alt-text content-type="machine-generated">Grid of contour maps and a line graph showing sea level anomalies over lead times of zero to fifteen days. Each row represents different models, labeled such as O2-Curr, EQW NN, NN1 to NN12. The line graph on the top right indicates the anomaly correlation coefficient over time, with various colored lines representing different models. A color scale below spans blue to red, representing sea level anomaly values from negative zero point six to positive zero point six meters. The map locations are between 152 to 156 degrees east and 31 to 35 degrees south.</alt-text>
</graphic></fig>
<fig id="f10" position="float">
<label>Figure&#xa0;10</label>
<caption>
<p><bold>(a-d)</bold> Example 2: As for <xref ref-type="fig" rid="f9"><bold>Figure&#xa0;9</bold></xref>, for the EAC domain (Region 1, <xref ref-type="fig" rid="f1"><bold>Figure&#xa0;1</bold></xref>) for forecasts starting on 18 March 2023.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-12-1729116-g010.tif">
<alt-text content-type="machine-generated">Grid of contour plots and a line graph. Contour plots labeled (a) to (d12) display sea level anomalies (SLA) over time at different conditions and model settings, with color gradients indicating variations. The line graph shows anomaly correlation coefficient (ACC) over a 15-day lead time for various neural network models. Multiple lines represent different models with a legend. The time steps are t+0, t+5, t+10, and t+15. A color bar at the bottom ranges from -0.6 to 0.6 meters of SLA.</alt-text>
</graphic></fig>
<fig id="f11" position="float">
<label>Figure&#xa0;11</label>
<caption>
<p><bold>(a-d)</bold> Example 3: As for <xref ref-type="fig" rid="f9"><bold>Figure&#xa0;9</bold></xref>, except for the Lombok domain (Region 8, <xref ref-type="fig" rid="f1"><bold>Figure&#xa0;1</bold></xref>) for forecasts starting on 28 November 2023.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-12-1729116-g011.tif">
<alt-text content-type="machine-generated">The image contains a series of panels showing predicted sea level anomalies (SLA) at various lead times (t+0, t+5, t+10, t+15). The panels are organized in rows representing different neural network models, labeled NN1 to NN12. Each panel uses a color gradient to represent SLA values, ranging from blue (negative anomalies) to red (positive anomalies). Graph (e) at the top right corner displays a plot of the Anomaly Correlation Coefficient (ACC) against lead time, with different lines for each model. A legend at the top specifies the models corresponding to each line style.</alt-text>
</graphic></fig>
<fig id="f12" position="float">
<label>Figure&#xa0;12</label>
<caption>
<p><bold>(a-d)</bold> Example 4: As for <xref ref-type="fig" rid="f9"><bold>Figure&#xa0;9</bold></xref>, except for the Perth domain (Region 11, <xref ref-type="fig" rid="f1"><bold>Figure&#xa0;1</bold></xref>) and for forecasts starting on 16 July 2023.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-12-1729116-g012.tif">
<alt-text content-type="machine-generated">A grid of maps on the left displays sea level anomalies over time in various models, with orange indicating high anomalies and blue indicating low. Each row corresponds to different neural network models. On the right, a line graph shows the anomaly correlation coefficient (ACC) against lead time, comparing several models. Each model's performance is marked with distinct colored and patterned lines. The x-axis indicates lead time in days, and the y-axis represents the ACC. A color scale below maps indicates the sea level anomaly range in meters.</alt-text>
</graphic></fig>
<fig id="f13" position="float">
<label>Figure&#xa0;13</label>
<caption>
<p><bold>(a-d)</bold> Example 5: As for <xref ref-type="fig" rid="f9"><bold>Figure&#xa0;9</bold></xref>, except for the GAB domain (Region 12, <xref ref-type="fig" rid="f1"><bold>Figure&#xa0;1</bold></xref>) and for forecasts starting on 17 May 2023.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-12-1729116-g013.tif">
<alt-text content-type="machine-generated">A grid of maps showing sea level anomalies (SLA) in meters, ranging from -0.4 to 0.4, across various lead times (0 to 15 days). Each row represents a different dataset or model, labeled accordingly. The image shows color variations from blue to red, indicating SLA changes over time. A line graph in the top right shows Anomaly Correlation Coefficients (ACC) over lead time for different models, with a black line representing the mean.</alt-text>
</graphic></fig>
<p>Interestingly, for most cases, the initial conditions of each NN (at t+0) are often quite different from the verifying analyses at t+0. This is not surprising, because each NN is identified based on its similarity to the observed evolution over a 10-day period, not necessarily its initial state (at t+0).</p>
<sec id="s4_3_1">
<label>4.3.1</label>
<title>Example 1: Eastern Australian Current Region</title>
<p><xref ref-type="fig" rid="f9"><bold>Figure&#xa0;9</bold></xref> shows an ensemble forecast for the EAC domain (Region 1), initialised on 2 January 2023. The dominant feature at t+0 is a cyclonic eddy at &#x223c;32<sup>&#x25e6;</sup>S. Over the first week, this eddy splits into two smaller cyclonic eddies, one of which elongates meridionally and merges with shelf waters. By t+15, the verifying analysis shows a weakened, isotropic cyclonic eddy near 155<sup>&#x25e6;</sup>E.</p>
<p>Several NNs (NN4, NN10, NN11, and NN12) reproduce these key features well. The verifying analysis also indicates a cyclonic feature emerging by t+10 in the northeastern corner of the domain. While NN4 and NN12 capture this feature to some extent, none of the NNs predict it accurately.</p>
<p>Among all forecasts, NN10 has the highest ACC at t+15 (<xref ref-type="fig" rid="f9"><bold>Figure&#xa0;9e</bold></xref>), forecasting the details of the small cyclonic eddy at 32<sup>&#x25e6;</sup>S, and realistically forecasting the distortion of the surrounding high-pressure system (the orange region in the south-east of the domain, <xref ref-type="fig" rid="f9"><bold>Figure&#xa0;9d</bold></xref>), and the low sea level along the coast.</p>
</sec>
<sec id="s4_3_2">
<label>4.3.2</label>
<title>Example 2: EAC&#x2014;High Variability Case</title>
<p><xref ref-type="fig" rid="f10"><bold>Figure&#xa0;10</bold></xref> provides another example from the EAC domain, chosen to highlight a case where SLA undergoes significant changes during the forecast period. At t+0, two cyclonic eddies are evident in the northern half of the domain. These eddies coalesce into a single, stronger cyclonic eddy within the first 5 days and then drift southward. Only about half of the NNs (NN1, NN2, NN6, NN7, NN11) capture both initial eddies. All NNs that correctly represent these features in their initial conditions predict their coalescence. By t+15, NN1 has the highest ACC, with a correlation of about 0.7.</p>
</sec>
<sec id="s4_3_3">
<label>4.3.3</label>
<title>Example 3: Lombok domain</title>
<p>The Lombok domain (Region 8) exhibits variability that is quite different to the EAC domain. <xref ref-type="fig" rid="f11"><bold>Figure&#xa0;11</bold></xref> presents a forecast for a period when a low-pressure anomaly near Lombok Strait pinches off from the coast, forming a strong, quasi-isotropic cyclonic eddy. This development is well forecasted by most of the NNs, and is well-represented in the ensemble mean.</p>
<p>Again, <xref ref-type="fig" rid="f11"><bold>Figure&#xa0;11e</bold></xref> shows that the most precise forecast is not from the ensemble mean and is not from NN1, but is from NN7. By t+15, the SLA forecast error for NN7 is less than 4 cm, with an ACC of over 0.8. For comparison, the SLA signal during this event exceeds 30 cm, indicating that this forecast has a small error relative to the signal.</p>
</sec>
<sec id="s4_3_4">
<label>4.3.4</label>
<title>Example 4: Perth Region&#x2014;Complex Eddy Fields</title>
<p><xref ref-type="fig" rid="f12"><bold>Figure&#xa0;12</bold></xref> shows an ensemble of SLA forecasts for the Perth domain (Region 11). This case is notable for the presence of multiple small-scale mesoscale features. At t+0, the verifying analysis includes at least five distinct mesoscale features. While many NNs contain multiple mesoscale features, most fail to match the correct intensity or precise position of all mesoscale features. This highlights one of the challenges of ocean forecasting &#x2013; the problem of high dimensionality. Even using two-dimensional SLA fields, the ocean can include many small-scale features that are challenging to quantitatively reproduce in a model.</p>
<p>Despite the complexity in this example, some NNs &#x2013; particularly NN6 and NN10 &#x2013; produce forecasts that may be useful to an end user. These NNs capture most of the mesoscale features, albeit with differences in intensity and location.</p>
<p>In general, we expect that the analog forecasting approach may not produce reliable forecasts for this type of scenario. However, experienced end users may recognise the inherent uncertainty in such cases and adjust their expectations accordingly.</p>
</sec>
<sec id="s4_3_5">
<label>4.3.5</label>
<title>Example 5: Great Australian Bight</title>
<p>The final example (<xref ref-type="fig" rid="f13"><bold>Figure&#xa0;13</bold></xref>) is for the Great Australian Bight (GAB), near the Bonney Coast (Region 12). The circulation in this region is known to be strongly wind-driven (<xref ref-type="bibr" rid="B64">Middleton and Bye, 2007</xref>). Because of this, we expect that selection of NNs based solely on initial conditions (or more precisely, conditions preceding t+0) will likely fail to predict developing wind-driven events. This limitation is evident in this example &#x2013; with different NNs capturing wind-driven variability at different times leading to high SLA variability in the northeastern corner of the domain. However, the verifying analysis does not show this variability. This highlights a case where NN forecasting may be unsuitable. An option to try to address this could involve using forecast winds to identify NNs for wind-driven regions &#x2013; though we haven&#x2019;t explored this possibility.</p>
</sec>
<sec id="s4_3_6">
<label>4.3.6</label>
<title>Summary</title>
<p>These examples demonstrate the strengths and limitations of kNN and analog forecasting for predicting the mesoscale ocean circulation. While this method can effectively capture mesoscale features, NN selection based on conditions preceding t+0 alone may perform unreliably in regions dominated by wind forcing or complex eddy interactions. However, by considering forecast uncertainty and ensemble behaviour, end users may be able to interpret forecast reliability and adjust their expectations accordingly.</p>
</sec>
</sec>
<sec id="s4_4">
<label>4.4</label>
<title>Sensitivity experiments</title>
<p>A key question in ensemble data assimilation studies relates to the optimal ensemble size. For this study, this is the same as seeking the optimal number of NNs for each forecast. The efficiency of the kNN approach readily permits performance of a comprehensive set of sensitivity tests.</p>
<p>For each forecast, we calculate the MAD between the ensemble mean of the first 1, 2, &#x2026;, 100 NNs and the verifying analyses (from OceanCurrent). <xref ref-type="fig" rid="f14"><bold>Figure&#xa0;14</bold></xref> shows the average MAD as a function of ensemble size, averaged over all 300 forecasts (25 forecasts across 12 domains). While no single optimal ensemble size is evident, averaging 10&#x2013;25 NNs seems to produce the most accurate ensemble-mean forecast. This result guided our choice of 12 NNs for results presented in this study.</p>
<fig id="f14" position="float">
<label>Figure&#xa0;14</label>
<caption>
<p>MAD plotted as a function of ensemble size. Statistics are calculated from 25 15-day forecasts for 12 domains (a total of 300 forecasts). The optimal ensemble size is not well-defined &#x2013; ranging from about 9 to 20 &#x2013; but the minimal average MAD is achieved with an ensemble size of 12 for the cases considered here.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-12-1729116-g014.tif">
<alt-text content-type="machine-generated">A line graph illustrating the relationship between ensemble size and Mean Absolute Deviation (MAD) in meters. The MAD decreases sharply from 0.052 to approximately 0.042 as ensemble size increases from 0 to 10, then stabilizes and slightly increases after ensemble size 25 up to 100.</alt-text>
</graphic></fig>
<p>Compared to traditional ocean forecast systems, there are relatively few &#x201c;tuneable parameters&#x201d; in an analog forecast system. However, results can be sensitive to the data included in the archive and the method used to identify NNs. We summarise a series of sensitivity experiments in <xref ref-type="table" rid="T3"><bold>Table&#xa0;3</bold></xref>. This includes experiments using different sources of SLA in the archive, using a different metric for identifying NNs, using a different observation window for identification of the NNs, and using a different ensemble size. We present these mean statistics to demonstrate the sensitivity, but we have not applied the same rigorous statistical tests that we applied to the results in <xref ref-type="fig" rid="f6"><bold>Figures&#xa0;6</bold></xref>, <xref ref-type="fig" rid="f7"><bold>7</bold></xref>. Here, we aim merely to quantify the sensitivity, rather than definitively identify the &#x201c;optimal&#x201d; configuration.</p>
<table-wrap id="T3" position="float">
<label>Table&#xa0;3</label>
<caption>
<p>Average ACC for forecast day 1&#x2013;6 for each forecast experiment and for each domain.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="bottom" rowspan="2" align="left">Experiment</th>
<th valign="middle" colspan="12" align="center">ACC</th>
</tr>
<tr>
<th valign="middle" align="center">1</th>
<th valign="middle" align="center">2</th>
<th valign="middle" align="center">3</th>
<th valign="middle" align="center">4</th>
<th valign="middle" align="center">5</th>
<th valign="middle" align="center">6</th>
<th valign="middle" align="center">7</th>
<th valign="middle" align="center">8</th>
<th valign="middle" align="center">9</th>
<th valign="middle" align="center">10</th>
<th valign="middle" align="center">11</th>
<th valign="middle" align="center">12</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="left">OceanMAPSv4.0i</td>
<td valign="middle" align="center">0.72</td>
<td valign="middle" align="center">0.83</td>
<td valign="middle" align="center">0.73</td>
<td valign="middle" align="center">0.75</td>
<td valign="middle" align="center">0.72</td>
<td valign="middle" align="center"><bold>0.85*</bold></td>
<td valign="middle" align="center">0.71</td>
<td valign="middle" align="center">0.61</td>
<td valign="middle" align="center">0.81</td>
<td valign="middle" align="center">0.67</td>
<td valign="middle" align="center">0.64</td>
<td valign="middle" align="center">0.49</td>
</tr>
<tr>
<td valign="middle" align="left">Exp.1 (ACC ID w/10 d)</td>
<td valign="middle" align="center">0.80</td>
<td valign="middle" align="center">0.84</td>
<td valign="middle" align="center">0.75</td>
<td valign="middle" align="center">0.77</td>
<td valign="middle" align="center">0.78</td>
<td valign="middle" align="center">0.81</td>
<td valign="middle" align="center">0.70</td>
<td valign="middle" align="center">0.73</td>
<td valign="middle" align="center"><bold>0.84</bold></td>
<td valign="middle" align="center">0.75</td>
<td valign="middle" align="center">0.71</td>
<td valign="middle" align="center"><bold>0.58</bold></td>
</tr>
<tr>
<td valign="middle" align="left">Exp.2 (E1 w/MAD ID)</td>
<td valign="middle" align="center">0.78</td>
<td valign="middle" align="center">0.83</td>
<td valign="middle" align="center">0.72</td>
<td valign="middle" align="center">0.71</td>
<td valign="middle" align="center">0.77</td>
<td valign="middle" align="center"><bold>0.83</bold></td>
<td valign="middle" align="center">0.71</td>
<td valign="middle" align="center">0.73</td>
<td valign="middle" align="center">0.82</td>
<td valign="middle" align="center">0.71</td>
<td valign="middle" align="center">0.71</td>
<td valign="middle" align="center">0.54</td>
</tr>
<tr>
<td valign="middle" align="left">Exp.3 (E1 w/4d)</td>
<td valign="middle" align="center">0.81</td>
<td valign="middle" align="center">0.84</td>
<td valign="middle" align="center">0.76</td>
<td valign="middle" align="center">0.77</td>
<td valign="middle" align="center">0.78</td>
<td valign="middle" align="center">0.80</td>
<td valign="middle" align="center">0.69</td>
<td valign="middle" align="center">0.72</td>
<td valign="middle" align="center">0.83</td>
<td valign="middle" align="center"><bold>0.77</bold></td>
<td valign="middle" align="center">0.74</td>
<td valign="middle" align="center">0.55</td>
</tr>
<tr>
<td valign="middle" align="left">Exp.4 (E1 w/15d)</td>
<td valign="middle" align="center">0.77</td>
<td valign="middle" align="center">0.83</td>
<td valign="middle" align="center">0.71</td>
<td valign="middle" align="center">0.73</td>
<td valign="middle" align="center">0.76</td>
<td valign="middle" align="center">0.81</td>
<td valign="middle" align="center">0.69</td>
<td valign="middle" align="center">0.72</td>
<td valign="middle" align="center">0.80</td>
<td valign="middle" align="center">0.73</td>
<td valign="middle" align="center">0.70</td>
<td valign="middle" align="center">0.55</td>
</tr>
<tr>
<td valign="middle" align="left">Exp.5 (E1 w/7d)</td>
<td valign="middle" align="center">0.82</td>
<td valign="middle" align="center"><bold>0.85</bold></td>
<td valign="middle" align="center">0.77</td>
<td valign="middle" align="center">0.77</td>
<td valign="middle" align="center">0.79</td>
<td valign="middle" align="center">0.80</td>
<td valign="middle" align="center">0.69</td>
<td valign="middle" align="center">0.75</td>
<td valign="middle" align="center"><bold>0.84</bold></td>
<td valign="middle" align="center">0.75</td>
<td valign="middle" align="center"><bold>0.74</bold></td>
<td valign="middle" align="center">0.56</td>
</tr>
<tr>
<td valign="middle" align="left">Exp.6 (E1+CM85)</td>
<td valign="middle" align="center">0.81</td>
<td valign="middle" align="center">0.84</td>
<td valign="middle" align="center">0.75</td>
<td valign="middle" align="center">0.76</td>
<td valign="middle" align="center">0.78</td>
<td valign="middle" align="center">0.81</td>
<td valign="middle" align="center">0.70</td>
<td valign="middle" align="center">0.73</td>
<td valign="middle" align="center"><bold>0.84</bold></td>
<td valign="middle" align="center">0.75</td>
<td valign="middle" align="center">0.72</td>
<td valign="middle" align="center"><bold>0.58</bold></td>
</tr>
<tr>
<td valign="middle" align="left">Exp.7 (E1-Y79R-C100-OF*)</td>
<td valign="middle" align="center">0.77</td>
<td valign="middle" align="center">0.83</td>
<td valign="middle" align="center">0.75</td>
<td valign="middle" align="center">0.76</td>
<td valign="middle" align="center">0.78</td>
<td valign="middle" align="center">0.81</td>
<td valign="middle" align="center">0.69</td>
<td valign="middle" align="center">0.74</td>
<td valign="middle" align="center">0.83</td>
<td valign="middle" align="center">0.74</td>
<td valign="middle" align="center">0.69</td>
<td valign="middle" align="center">0.53</td>
</tr>
<tr>
<td valign="middle" align="left">Exp.8 (AOM4 w/10d)</td>
<td valign="middle" align="center">0.73</td>
<td valign="middle" align="center">0.76</td>
<td valign="middle" align="center">0.69</td>
<td valign="middle" align="center">0.70</td>
<td valign="middle" align="center">0.74</td>
<td valign="middle" align="center">0.79</td>
<td valign="middle" align="center">0.64</td>
<td valign="middle" align="center">0.73</td>
<td valign="middle" align="center">0.79</td>
<td valign="middle" align="center">0.69</td>
<td valign="middle" align="center">0.69</td>
<td valign="middle" align="center">0.50</td>
</tr>
<tr>
<td valign="middle" align="left">Exp.9 (CM85+BR*)</td>
<td valign="middle" align="center">0.81</td>
<td valign="middle" align="center"><bold>0.85</bold></td>
<td valign="middle" align="center">0.75</td>
<td valign="middle" align="center">0.77</td>
<td valign="middle" align="center">0.78</td>
<td valign="middle" align="center">0.81</td>
<td valign="middle" align="center">0.70</td>
<td valign="middle" align="center">0.74</td>
<td valign="middle" align="center"><bold>0.84</bold></td>
<td valign="middle" align="center">0.74</td>
<td valign="middle" align="center">0.72</td>
<td valign="middle" align="center"><bold>0.58</bold></td>
</tr>
<tr>
<td valign="middle" align="left">Exp.10 (E9 w/6d)</td>
<td valign="middle" align="center">0.82</td>
<td valign="middle" align="center"><bold>0.85</bold></td>
<td valign="middle" align="center">0.77</td>
<td valign="middle" align="center">0.77</td>
<td valign="middle" align="center">0.79</td>
<td valign="middle" align="center">0.82</td>
<td valign="middle" align="center">0.70</td>
<td valign="middle" align="center">0.75</td>
<td valign="middle" align="center">0.83</td>
<td valign="middle" align="center">0.76</td>
<td valign="middle" align="center">0.73</td>
<td valign="middle" align="center">0.56</td>
</tr>
<tr>
<td valign="middle" align="left">Exp.11 (E9 w/5d)</td>
<td valign="middle" align="center">0.82</td>
<td valign="middle" align="center">0.83</td>
<td valign="middle" align="center">0.76</td>
<td valign="middle" align="center">0.77</td>
<td valign="middle" align="center">0.79</td>
<td valign="middle" align="center">0.82</td>
<td valign="middle" align="center">0.69</td>
<td valign="middle" align="center">0.73</td>
<td valign="middle" align="center"><bold>0.84</bold></td>
<td valign="middle" align="center"><bold>0.77</bold></td>
<td valign="middle" align="center"><bold>0.74</bold></td>
<td valign="middle" align="center"><bold>0.58</bold></td>
</tr>
<tr>
<td valign="middle" align="left">Exp.12 (E9 w/7d)</td>
<td valign="middle" align="center">0.83</td>
<td valign="middle" align="center"><bold>0.85</bold></td>
<td valign="middle" align="center">0.77</td>
<td valign="middle" align="center"><bold>0.78</bold></td>
<td valign="middle" align="center">0.79</td>
<td valign="middle" align="center">0.79</td>
<td valign="middle" align="center">0.70</td>
<td valign="middle" align="center">0.75</td>
<td valign="middle" align="center"><bold>0.84</bold></td>
<td valign="middle" align="center">0.76</td>
<td valign="middle" align="center">0.73</td>
<td valign="middle" align="center">0.55</td>
</tr>
<tr>
<td valign="middle" align="left">Exp.13 (E9 w/8d)</td>
<td valign="middle" align="center">0.82</td>
<td valign="middle" align="center"><bold>0.85</bold></td>
<td valign="middle" align="center">0.76</td>
<td valign="middle" align="center">0.77</td>
<td valign="middle" align="center">0.79</td>
<td valign="middle" align="center">0.80</td>
<td valign="middle" align="center">0.69</td>
<td valign="middle" align="center">0.74</td>
<td valign="middle" align="center">0.83</td>
<td valign="middle" align="center">0.76</td>
<td valign="middle" align="center">0.73</td>
<td valign="middle" align="center">0.55</td>
</tr>
<tr>
<td valign="middle" align="left">Exp.14 (E12+OC)</td>
<td valign="middle" align="center"><bold>0.83</bold></td>
<td valign="middle" align="center"><bold>0.85</bold></td>
<td valign="middle" align="center">0.77</td>
<td valign="middle" align="center"><bold>0.78</bold></td>
<td valign="middle" align="center">0.79</td>
<td valign="middle" align="center">0.79</td>
<td valign="middle" align="center">0.70</td>
<td valign="middle" align="center">0.76</td>
<td valign="middle" align="center"><bold>0.84</bold></td>
<td valign="middle" align="center">0.76</td>
<td valign="middle" align="center">0.73</td>
<td valign="middle" align="center">0.55</td>
</tr>
<tr>
<td valign="middle" align="left">Exp.15 (E14 w/5d)</td>
<td valign="middle" align="center">0.82</td>
<td valign="middle" align="center">0.83</td>
<td valign="middle" align="center">0.76</td>
<td valign="middle" align="center">0.77</td>
<td valign="middle" align="center">0.79</td>
<td valign="middle" align="center">0.82</td>
<td valign="middle" align="center">0.69</td>
<td valign="middle" align="center">0.74</td>
<td valign="middle" align="center"><bold>0.84</bold></td>
<td valign="middle" align="center"><bold>0.77</bold></td>
<td valign="middle" align="center"><bold>0.74</bold></td>
<td valign="middle" align="center"><bold>0.58</bold></td>
</tr>
<tr>
<td valign="middle" align="left">Exp.16 (E14 + 12/36NNs)</td>
<td valign="middle" align="center">0.82</td>
<td valign="middle" align="center"><bold>0.85</bold></td>
<td valign="middle" align="center">0.76</td>
<td valign="middle" align="center"><bold>0.78</bold></td>
<td valign="middle" align="center">0.79</td>
<td valign="middle" align="center">0.81</td>
<td valign="middle" align="center"><bold>0.72</bold></td>
<td valign="middle" align="center"><bold>0.77</bold></td>
<td valign="middle" align="center"><bold>0.84</bold></td>
<td valign="middle" align="center">0.76</td>
<td valign="middle" align="center">0.73</td>
<td valign="middle" align="center"><bold>0.58</bold></td>
</tr>
<tr>
<td valign="middle" align="left">Exp.17 (E14+SD)</td>
<td valign="middle" align="center"><bold>0.83</bold></td>
<td valign="middle" align="center"><bold>0.85</bold></td>
<td valign="middle" align="center">0.77</td>
<td valign="middle" align="center">0.77</td>
<td valign="middle" align="center">0.79</td>
<td valign="middle" align="center">0.79</td>
<td valign="middle" align="center">0.69</td>
<td valign="middle" align="center">0.76</td>
<td valign="middle" align="center"><bold>0.84</bold></td>
<td valign="middle" align="center">0.76</td>
<td valign="middle" align="center">0.73</td>
<td valign="middle" align="center">0.55</td>
</tr>
<tr>
<td valign="middle" align="left">Exp.18 (E17 + 12/24NNs)</td>
<td valign="middle" align="center">0.82</td>
<td valign="middle" align="center"><bold>0.85</bold></td>
<td valign="middle" align="center">0.76</td>
<td valign="middle" align="center">0.77</td>
<td valign="middle" align="center"><bold>0.80</bold></td>
<td valign="middle" align="center">0.80</td>
<td valign="middle" align="center">0.71</td>
<td valign="middle" align="center"><bold>0.78</bold></td>
<td valign="middle" align="center"><bold>0.84</bold></td>
<td valign="middle" align="center">0.76</td>
<td valign="middle" align="center"><bold>0.74</bold></td>
<td valign="middle" align="center">0.56</td>
</tr>
<tr>
<td valign="middle" align="left">Exp.19 (E17 w/MAD ID)</td>
<td valign="middle" align="center">0.82</td>
<td valign="middle" align="center">0.83</td>
<td valign="middle" align="center">0.75</td>
<td valign="middle" align="center">0.74</td>
<td valign="middle" align="center">0.78</td>
<td valign="middle" align="center"><bold>0.83</bold></td>
<td valign="middle" align="center">0.71</td>
<td valign="middle" align="center">0.75</td>
<td valign="middle" align="center">0.83</td>
<td valign="middle" align="center">0.73</td>
<td valign="middle" align="center">0.73</td>
<td valign="middle" align="center">0.52</td>
</tr>
<tr>
<td valign="middle" align="left">Exp.20 (E17 w/MIX ID)</td>
<td valign="middle" align="center"><bold>0.83</bold></td>
<td valign="middle" align="center">0.84</td>
<td valign="middle" align="center">0.76</td>
<td valign="middle" align="center">0.75</td>
<td valign="middle" align="center">0.79</td>
<td valign="middle" align="center">0.80</td>
<td valign="middle" align="center">0.70</td>
<td valign="middle" align="center">0.76</td>
<td valign="middle" align="center"><bold>0.84</bold></td>
<td valign="middle" align="center">0.75</td>
<td valign="middle" align="center">0.73</td>
<td valign="middle" align="center">0.55</td>
</tr>
<tr>
<td valign="middle" align="left">Exp.21 (E17 w/6NNs)</td>
<td valign="middle" align="center">0.82</td>
<td valign="middle" align="center">0.84</td>
<td valign="middle" align="center">0.75</td>
<td valign="middle" align="center">0.76</td>
<td valign="middle" align="center">0.77</td>
<td valign="middle" align="center">0.76</td>
<td valign="middle" align="center">0.68</td>
<td valign="middle" align="center">0.76</td>
<td valign="middle" align="center">0.83</td>
<td valign="middle" align="center">0.74</td>
<td valign="middle" align="center">0.71</td>
<td valign="middle" align="center">0.54</td>
</tr>
<tr>
<td valign="middle" align="left">Exp.22 (E17 w/18NNs)</td>
<td valign="middle" align="center"><bold>0.83</bold></td>
<td valign="middle" align="center"><bold>0.85</bold></td>
<td valign="middle" align="center"><bold>0.78</bold></td>
<td valign="middle" align="center"><bold>0.78</bold></td>
<td valign="middle" align="center"><bold>0.80</bold></td>
<td valign="middle" align="center">0.79</td>
<td valign="middle" align="center">0.69</td>
<td valign="middle" align="center">0.76</td>
<td valign="middle" align="center"><bold>0.84</bold></td>
<td valign="middle" align="center">0.76</td>
<td valign="middle" align="center"><bold>0.74</bold></td>
<td valign="middle" align="center">0.56</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>The &#x201c;best&#x201d; result from the analog forecast system for each domain is bold; and domains where OceanMAPSv4.0i produced the best forecasts are denoted by an asterisk. Experiment 1 includes data from 11 runs in the archive (EISP, JRSP, Y79R, C100, AOM1, AOM2, AOM3, AOM4, AOMR, OFSC, OFSJ), uses a 10-day observation window to identify NNs, and uses ACC to identify NNs (ACC ID). The differences from Experiment 1 are denoted in the first column (e.g., &#x201c;E9 w/7d&#x201d; means the same as Exp. 9, but with a 7-day observational window to identify NNs; &#x201c;+CM85&#x201d; means the same as Exp. 1, except with data from CM85 in the archive; and &#x201c;-Y79R&#x201d; means the same as Exp. 1, except without data from Y79R in the archive).</p></fn>
</table-wrap-foot>
</table-wrap>
<p>Several general conclusions can be drawn from these sensitivity experiments. The observation window used for identifying NNs influences the forecast skill. Comparing experiments with an observation window of 4d (Exp. 3), 7d (Exp. 5), 10d (Exp. 1), and 15d (Exp. 4), suggests that 15d is too long, and 4d is too short. Further, we conclude that a 7d window produces the best forecasts. Inclusion of SLA data from additional, or fewer, sources in the archive also influences the forecast skill. We also find that there is some improvement when a larger ensemble is used &#x2013; though a more comprehensive assessment is warranted to strongly support this claim. Compare results with 12 members (Exp. 17), 6 members (Exp. 21), and 18 members (Exp. 22). For most cases, the results are intuitive, with inclusion of more data improving the forecast skill, and using less data degrading the forecast skill.</p>
<p>Overall, we find some sensitivities to different choices of configuration of the analog forecast system. Different domains seem to warrant different configurations. Noting the computational efficiency of this system, it&#x2019;s possible that every individual domain could be tuned for the best performance. However, we also note that the range of ACC for experiments presented in <xref ref-type="table" rid="T3"><bold>Table&#xa0;3</bold></xref> is small, so the improvement in forecast skill gained by tuning is not great. In fact, most of the differences reported here are not statistically significant, again highlighting the insensitivity of the kNN/analog approach to these choices.</p>
</sec>
</sec>
<sec id="s5" sec-type="discussion">
<label>5</label>
<title>Discussion</title>
<sec id="s5_1">
<label>5.1</label>
<title>Advantages of analog forecasting</title>
<p>Although kNN or analog forecasting is not yet widely used in oceanography, this study demonstrates its significant potential for mesoscale ocean forecasting. Compared to traditional ocean forecast systems, analog forecasting offers several advantages.</p>
<p>First, analog forecasting can produce dynamically consistent forecasts, avoiding the rapid degradation often seen with sequential data assimilation. This may be particularly beneficial for scenarios that are sensitive to dynamical imbalance, including forecasts of the mesoscale ocean circulation (e.g., <xref ref-type="bibr" rid="B79">Pilo et&#xa0;al., 2018</xref>) and biogeochemical (BGC) forecasting (e.g., <xref ref-type="bibr" rid="B82">Raghukumar et&#xa0;al., 2015</xref>). Analog forecasting can completely mitigate these issues by ensuring dynamic consistency in the forecast fields.</p>
<p>Second, analog forecasting allows targeted predictions for a subset of ocean variables (e.g., SLA, SST, or surface phytoplankton) without requiring a full ocean state to be predicted for every forecast. In this study, we chose to forecast only SLA, making our system computationally efficient, but still relevant to a number of end users. By contrast, traditional numerical models have to compute the entire ocean state for each forecast, even if the intent of the system is to forecast a subset of variables (e.g., SLA in one region).</p>
<p>Third, our approach is efficient and cost-effective. We generated an ensemble of 15-day forecasts for a 5<sup>&#x25e6;</sup> &#xd7; 5<sup>&#x25e6;</sup> domain in about 90 seconds using a modest virtual machine (with 4 Intel Xeon Gold 6430 cores and 14 GB RAM under VMware virtualization). By contrast, OceanMAPSv4.0i, the operational forecast system used for benchmarking, requires approximately 7,000 CPU hours (or 420,000 CPU minutes) to generate a global 6-day forecast, as reported in the 2023 OceanPredict National Report. The results in this study, for example, used 25 global OceanMAPS forecasts that were produced on a high-performance super-computer and required almost 20 CPU years to complete, and 300 regional analog forecasts (12 domains by 25 forecasts) that required about 7.5 CPU hours. The computational cost of our analog approach is therefore about 25,000 times lower than that of a traditional ocean forecasting system for this study.</p>
<p>Finally, the analog method can function as a multi-system tool. The model archive can incorporate fields from different models, configurations, and resolutions (<xref ref-type="table" rid="T1"><bold>Table&#xa0;1</bold></xref>). Since all models exhibit some systematic biases (e.g., excessive mixing, misplaced boundary currents, deep mixed layers), including multiple models allows the system to preferentially select NNs that minimise systematic errors.</p>
</sec>
<sec id="s5_2">
<label>5.2</label>
<title>Limitations of analog forecasting</title>
<p>Despite its advantages, analog forecasting has several limitations. Every analog forecast is merely selected from the model archive. The system can only predict events that have analogs in the archive, meaning that extreme events (e.g., marine heatwaves) can only be forecasted if similar cases exist in the archive of model states. This limitation becomes particularly relevant under climate change, where unprecedented conditions may emerge. One potential mitigation is to incorporate model simulations forced by future climate projections (e.g., CM85, C100; <xref ref-type="table" rid="T1"><bold>Table&#xa0;1</bold></xref>).</p>
<p>Another limitation is the dependence on observation quality and availability. If observations are sparse or lack adequate spatiotemporal coverage, selected NNs may be suboptimal, degrading forecast skill. To mitigate this, we used a 10-day sequence of observations for NN selection. Incorporating additional observation types (e.g., satellite SST or Argo profiles) is another avenue for improvement, as is combining analog forecasting with other model-data synthesis techniques (e.g., <xref ref-type="bibr" rid="B87">Rykova, 2023</xref>).</p>
<p>Moreover, analog forecasting is best suited for regional domains. Applying it at global or even basin scale is impractical due to the high dimensionality of ocean states. kNN methods are known to become unstable in high-dimensional spaces (e.g., <xref ref-type="bibr" rid="B78">Pestov, 2013</xref>). For this study, we performed experiments to systematically test domain sizes (from 3<sup>&#x25e6;</sup> &#xd7; 3<sup>&#x25e6;</sup> to 10<sup>&#x25e6;</sup> &#xd7; 10<sup>&#x25e6;</sup>) and found that smaller domains generally yield more accurate forecasts. A 5<sup>&#x25e6;</sup> &#xd7; 5<sup>&#x25e6;</sup> domain was chosen to balance accuracy and usability (i.e., we expect that a forecast on a 500 &#xd7; 500 km domain will be useful for many end users).</p>
<p>Global applications of analog forecasting would seem out of reach. Such an approach would require mesoscale features (e.g., eddies) across multiple ocean regimes to align, which is unlikely. <xref ref-type="bibr" rid="B57">Lorenz (1969)</xref> faced a similar issue when searching for analogs in atmospheric forecasting that included the entire northern hemisphere, noting that &#x201c;there are numerous mediocre analogs but no truly good ones&#x201d;. While global applications seem unrealistic, regional implementations show good potential.</p>
</sec>
<sec id="s5_3">
<label>5.3</label>
<title>Model archive considerations</title>
<p>The SLA fields in the archive used here (<xref ref-type="table" rid="T1"><bold>Table&#xa0;1</bold></xref>) are mostly from models, and mostly come from two types of model runs &#x2013; simulations with IAF, and simulations with climatological forcing, or RYF. Our results (<xref ref-type="table" rid="T2"><bold>Table&#xa0;2</bold></xref>) suggest that interannual forcing yields better performance for analog forecasting, though fields from climatological runs remain valuable given the chaotic nature of mesoscale circulation.</p>
<p>Currently, all models in our archive are based on the MOM. Expanding the archive to include simulations from other models such as NEMO (<xref ref-type="bibr" rid="B60">Madec, 2016</xref>), the MIT GCM (<xref ref-type="bibr" rid="B2">Adcroft et&#xa0;al., 2004</xref>), or HYCOM (<xref ref-type="bibr" rid="B18">Chassignet et&#xa0;al., 2007</xref>) could further improve forecast skill.</p>
<p>Although most of the results presented in this study use SLA fields from free-running models, with no data assimilation, we have also performed forecasts using fields from ocean reanalyses and observation-based analyses (<xref ref-type="table" rid="T1"><bold>Tables&#xa0;1</bold></xref>-<xref ref-type="table" rid="T3"><bold>3</bold></xref>). When these additional sources are included, we find that many NNs are identified from these datasets (<xref ref-type="table" rid="T2"><bold>Table&#xa0;2</bold></xref>) and the forecast skill typically improves (<xref ref-type="table" rid="T3"><bold>Table&#xa0;3</bold></xref>). Close inspection of the ensuing forecasts from these sources (not shown) exposes the problems with these datasets - often with noticeable discontinuities in SLA over the forecast period. The tradeoff between improved forecast skill and dynamically inconsistent forecasts is something that needs to be considered for any application.</p>
</sec>
<sec id="s5_4">
<label>5.4</label>
<title>Selection of NNs</title>
<p>In our experiments, we chose to use ACC between along-track altimetry and model SLA fields to select NNs. We also ran a comprehensive set of experiments using MAD, which yielded similar selections. However, forecasts using ACC to select NNs resulted in better agreement with verifying analyses.</p>
<p>For SLA forecasting, we think ACC is the most appropriate metric because the primary goal of the system is to provide qualitative guidance. In this context, accurately predicting the location, size, and shape of mesoscale features is more important than precisely matching their amplitude, or the amplitude of SLA over a broader area.</p>
<p>The most commonly used error metrics are MAD, Mean Squared Difference (MSD), and ACC. These metrics are mathematically related. For a Gaussian sample, MSD &#x2248; <italic>&#x3c0;</italic>/2 MAD<sup>2</sup>. Furthermore, MSD can be formally expressed in terms of ACC. The MSD (<xref ref-type="disp-formula" rid="eq1">Equation 1</xref>) between two vectors <italic>X</italic> and <italic>Y</italic> can be expressed as:</p>
<disp-formula id="eq1"><label>(1)</label>
<mml:math display="block" id="M1"><mml:mrow><mml:mtext>MSD</mml:mtext><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>X</mml:mi><mml:mo>,</mml:mo><mml:mi>Y</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>=</mml:mo><mml:msup><mml:mrow><mml:mover accent="true"><mml:mrow><mml:mi>X</mml:mi><mml:mo>&#x2212;</mml:mo><mml:mi>Y</mml:mi></mml:mrow><mml:mo stretchy="true">&#xaf;</mml:mo></mml:mover></mml:mrow><mml:mn>2</mml:mn></mml:msup><mml:mo>+</mml:mo><mml:msup><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:msub><mml:mi>&#x3c3;</mml:mi><mml:mi>X</mml:mi></mml:msub><mml:mo>&#x2212;</mml:mo><mml:msub><mml:mi>&#x3c3;</mml:mi><mml:mi>Y</mml:mi></mml:msub><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mn>2</mml:mn></mml:msup><mml:mo>+</mml:mo><mml:mn>2</mml:mn><mml:msub><mml:mi>&#x3c3;</mml:mi><mml:mi>X</mml:mi></mml:msub><mml:msub><mml:mi>&#x3c3;</mml:mi><mml:mi>Y</mml:mi></mml:msub><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mn>1</mml:mn><mml:mo>&#x2212;</mml:mo><mml:mtext>ACC</mml:mtext></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>,</mml:mo></mml:mrow></mml:math>
</disp-formula>
<p>where MSD is the mean squared difference, <inline-formula>
<mml:math display="inline" id="im2"><mml:mrow><mml:mover accent="true"><mml:mrow><mml:mi>X</mml:mi><mml:mo>&#x2212;</mml:mo><mml:mi>Y</mml:mi></mml:mrow><mml:mo stretchy="true">&#xaf;</mml:mo></mml:mover></mml:mrow></mml:math></inline-formula> is the bias, and <inline-formula>
<mml:math display="inline" id="im3"><mml:mrow><mml:msub><mml:mi>&#x3c3;</mml:mi><mml:mi>X</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> and <inline-formula>
<mml:math display="inline" id="im4"><mml:mrow><mml:msub><mml:mi>&#x3c3;</mml:mi><mml:mi>Y</mml:mi></mml:msub></mml:mrow></mml:math></inline-formula> are standard deviations of <inline-formula>
<mml:math display="inline" id="im5"><mml:mi>X</mml:mi></mml:math></inline-formula> and <inline-formula>
<mml:math display="inline" id="im6"><mml:mi>Y</mml:mi></mml:math></inline-formula> (e.g., <xref ref-type="bibr" rid="B67">Murphy, 1996</xref>; <xref ref-type="bibr" rid="B70">Oke et&#xa0;al., 2002a</xref>).</p>
<p>These relationships indicate that selecting NNs based on MAD (or MSD) implicitly incorporates comparisons of mean fields (close to zero in this case, since SLA is an anomaly); the amplitude of mesoscale features (quantified by standard deviation); and the location and shape of mesoscale features (quantified by the ACC). Since our objective is to produce forecasts that qualitatively inform decision making, we prioritise ACC for selecting NNs, as it better captures the spatial structure of mesoscale variability.</p>
</sec>
<sec id="s5_5">
<label>5.5</label>
<title>Comparison with ensemble data assimilation</title>
<p>While kNN and analog forecasting are not widely used in ocean forecasting, the approach shares similarities with ensemble data assimilation methods. It can be shown that a field of increments from EnOI- or EnKF-based systems can be expressed as a linear combination of ensemble anomalies (e.g., <xref ref-type="bibr" rid="B76">Oke et&#xa0;al., 2007</xref>, <xref ref-type="bibr" rid="B74">2021</xref>). Moreover, one of the key advantages of EnKF over EnOI is that the EnKF generates ensemble members that are relevant to the current forecast (e.g., <xref ref-type="bibr" rid="B88">Sakov and Oke, 2008</xref>), sometimes called the &#x201c;errors of the day&#x201d; (e.g., <xref ref-type="bibr" rid="B69">O&#x2019;Kane et&#xa0;al., 2011</xref>). An analog system also produces an ensemble of NNs (ensemble members) that are relevant to the current state. Here, we combine these NNs to produce an ensemble mean &#x2013; a linear combination of members. We can therefore see that in this way, this approach is similar to EnOI and EnKF, but at a fraction of the computational cost. However, unlike EnOI or the EnKF, analog forecasting does not exploit this ensemble to assimilate data. An ensemble of analog forecasts is merely intended to produce multiple estimates of possible future conditions.</p>
<p>When ensembles are used by traditional forecast systems, the ensemble is used both as an ensemble prediction, and to quantify the system&#x2019;s error covariance, for data assimilation. When used for data assimilation, the system generally performs better when a large ensemble is used (e.g., <xref ref-type="bibr" rid="B66">Mitchell et&#xa0;al., 2002</xref>). While this may also be useful for ensemble prediction, the quantity of forecasts may become unmanageable for users to exploit.</p>
</sec>
<sec id="s5_6">
<label>5.6</label>
<title>Interpreting ensembles</title>
<p>In ensemble forecasting, the ensemble mean is often considered the primary output (e.g., <xref ref-type="bibr" rid="B21">Counillon et&#xa0;al., 2009</xref>; <xref ref-type="bibr" rid="B89">Sakov and Sandery, 2015</xref>; <xref ref-type="bibr" rid="B3">Aijaz et&#xa0;al., 2023</xref>). However, as shown in <xref ref-type="fig" rid="f9"><bold>Figures&#xa0;9</bold></xref>-<xref ref-type="fig" rid="f13"><bold>13</bold></xref>, individual ensemble members can provide valuable insight, particularly for mesoscale feature prediction.</p>
<p>End users may benefit from considering both the ensemble mean and individual forecasts. A key question is whether the ensemble mean is always the best metric for assessing forecast skill. The goal of an ensemble forecast is to represent a range of plausible future states. Even if the ensemble mean is inaccurate, the system succeeds if at least one ensemble member closely matches reality. This perspective is common in atmospheric forecasting and could be more widely adopted in oceanography.</p>
<p>For many of the examples presented here (<xref ref-type="fig" rid="f9"><bold>Figures&#xa0;9</bold></xref>-<xref ref-type="fig" rid="f13"><bold>13</bold></xref> and in the <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material</bold></xref>), the most skilful forecast is often one of the NNs, not the ensemble mean of NNs. This may also be true for traditional ensemble data assimilation systems, and is something that warrants consideration.</p>
</sec>
<sec id="s5_7">
<label>5.7</label>
<title>On the value of forecasting a subset of the ocean state</title>
<p>In this study, we demonstrate that analog forecasts can outperform traditional forecasts for a subset of variables. Applications to NWP drew similar conclusions (e.g., <xref ref-type="bibr" rid="B56">Langmack et&#xa0;al., 2012</xref>; <xref ref-type="bibr" rid="B68">Nagarajan et&#xa0;al., 2015</xref>). Here, we consider the potential value of forecasting only a subset of the ocean state, compared to the entire state. Many marine industries rely on ocean forecasts to guide decision-making (e.g., <xref ref-type="bibr" rid="B53">Kourafalou et&#xa0;al., 2015</xref>; <xref ref-type="bibr" rid="B94">Schiller et&#xa0;al., 2020</xref>; <xref ref-type="bibr" rid="B84">Rautenbach and Blair, 2021</xref>; <xref ref-type="bibr" rid="B20">Ciliberti et&#xa0;al., 2023</xref>; <xref ref-type="bibr" rid="B97">Spillman et&#xa0;al., 2025</xref>). Most forecasts provided by national weather centres offer a comprehensive suite of data and products (e.g., <xref ref-type="bibr" rid="B12">Brassington et&#xa0;al., 2023</xref>). However, many end users do not fully exploit these forecasts. Instead, they tend to make decisions based on qualitative assessments &#x2013; simply analysing images of predicted conditions (e.g., <xref ref-type="bibr" rid="B42">H&#xf6;llt et&#xa0;al., 2013</xref>; <xref ref-type="bibr" rid="B55">Kuonen et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B97">Spillman et&#xa0;al., 2025</xref>) or considering indices that summarise broad-scale conditions (e.g., <xref ref-type="bibr" rid="B54">Kumar et&#xa0;al., 2014</xref>; <xref ref-type="bibr" rid="B95">Siedlecki et&#xa0;al., 2023</xref>), and making modest adjustments to their plans. This is especially true for industries sensitive to mesoscale ocean variability, including oil and gas, fisheries, search and rescue, shipping, and Defence.</p>
<p>For example, the operator of a fishing vessel might target a specific ocean feature, such as a cyclonic eddy. Their interest is likely in the location and intensity of a specific eddy (e.g., <xref ref-type="bibr" rid="B107">Xing et&#xa0;al., 2023</xref>). A shipping company might seek deviations from a direct port-to-port route, modestly adjusting their path only if favourable conditions are likely (e.g., <xref ref-type="bibr" rid="B27">Dickson et&#xa0;al., 2019</xref>). In search and rescue, identifying the current and near-future direction of surface currents is likely most crucial (e.g., <xref ref-type="bibr" rid="B85">Rosebrock et&#xa0;al., 2015</xref>). For defence, the presence or absence of strong mesoscale features could present risks or opportunities in undersea warfare (e.g., <xref ref-type="bibr" rid="B14">Bub et&#xa0;al., 2014</xref>). Oil and gas operations may need to anticipate strong currents that could jeopardise exploratory activities or to support incidents like oil spill response (e.g., <xref ref-type="bibr" rid="B58">Lubchenco et&#xa0;al., 2012</xref>). Most of these considerations may be associated with strong mesoscale eddies in their area of operation. For all these applications, a reliable forecast of SLA, from which estimates of geostrophic currents can readily be calculated, is likely to be valuable. Moreover, for many applications, a detailed forecast of subsurface properties may be unnecessary. Analog forecasting offers an approach that allows a subset of variables to be predicted, and may be a sensible option for many applications.</p>
</sec>
</sec>
<sec id="s6">
<label>6</label>
<title>Pseudo-code</title>
<p>The code for performing a kNN/analog forecast is uncomplicated. We present the pseudo-code for this system below, including each step to initialise the system, identify the NNs, and evaluate each forecast.</p>
<p>Pseudo-code for kNN/analog system</p>
<p>1. Initialise experiment</p>
<list list-type="simple">
<list-item>
<p>- Load experiment parameters (e.g., variable, archive datasets, etc.).</p></list-item>
<list-item>
<p>- Load archive metadata.</p></list-item>
<list-item>
<p>- Set region loop.</p></list-item>
</list>
<p>2. For each region:</p>
<p>2.1 Load archive</p>
<list list-type="simple">
<list-item>
<p>- For each archived dataset (i.e., model runs):</p>
<list list-type="simple">
<list-item>
<p>* Read time, grid, variable.</p></list-item>
<list-item>
<p>* Remove times overlapping verification.</p></list-item>
<list-item>
<p>* Convert to anomalies if needed (subtract temporal mean).</p></list-item>
<list-item>
<p>* Interpolate to common grid if needed.</p></list-item>
</list></list-item>
<list-item>
<p>- Concatenate all datasets into archive.</p></list-item>
</list>
<p>2.2 Load verifying analysis grid</p>
<list list-type="simple">
<list-item>
<p>- Read OceanCurrent time, grid, variable.</p></list-item>
<list-item>
<p>- Subset to region.</p></list-item>
</list>
<p>3. Loop over forecasts:</p>
<p>For each forecast initialisation time:</p>
<p>3.1 Compute archive-observation similarity</p>
<list list-type="simple">
<list-item>
<p>- For each archive time:</p>
<list list-type="simple">
<list-item>
<p>* Interpolate archive to observation locations.</p></list-item>
<list-item>
<p>* Compute MAD and ACC.</p></list-item>
<list-item>
<p>* Mask archive times near gaps between datasets.</p></list-item>
</list></list-item>
</list>
<p>3.2 Select nearest neighbours</p>
<list list-type="simple">
<list-item>
<p>- Identify NN1 as the sequence with the highest ACC or lowest MAD.</p></list-item>
<list-item>
<p>- Exclude archive elements within 45 days of NN1, and identify NN2.</p></list-item>
<list-item>
<p>- Repeat for <italic>k</italic> NNs, where <inline-formula>
<mml:math display="inline" id="im7"><mml:mi>k</mml:mi></mml:math></inline-formula> is the ensemble size.</p></list-item>
</list>
<p>3.3 Assemble ensemble forecasts</p>
<list list-type="simple">
<list-item>
<p>- For each NN and lead time, extract SLA field.</p></list-item>
<list-item>
<p>- Build 4D ensemble array.</p></list-item>
</list>
<p>3.4 Compute ensemble forecasts</p>
<list list-type="simple">
<list-item>
<p>- Equal-weight (kNN EqW) forecast.</p></list-item>
<list-item>
<p>- Load benchmark (OMv4.0i) for comparison.</p></list-item>
</list>
<p>3.5 Evaluate skill statistics for all lead times (0&#x2013;15 days) for kNN and OMv4.0i.</p>
<list list-type="simple">
<list-item>
<p>- Compute ACC and MAD for ensemble mean.</p></list-item>
<list-item>
<p>- Compute ACC and MAD for each NN (ensemble member).</p></list-item>
</list>
<p>3.6 Rank histograms</p>
<list list-type="simple">
<list-item>
<p>- Compare verifying SLA to ensemble.</p></list-item>
<list-item>
<p>- Construct and store rank histogram.</p></list-item>
</list>
<p>3.7 Save outputs</p>
<list list-type="simple">
<list-item>
<p>- Save derived data (metrics, histograms, NN indices, etc.).</p></list-item>
<list-item>
<p>- Optional plots.</p></list-item>
</list>
<p>4. After all forecasts:</p>
<list list-type="simple">
<list-item>
<p>- Average statistics across all dates.</p></list-item>
<list-item>
<p>- Save summary figures and data files.</p></list-item>
</list>
<p>End.</p>
</sec>
<sec id="s7" sec-type="conclusions">
<label>7</label>
<title>Conclusions</title>
<p>Analog forecasting has been successfully applied in NWP (e.g., <xref ref-type="bibr" rid="B5">Bagtasa, 2021</xref>) and seasonal forecasting (e.g., <xref ref-type="bibr" rid="B102">Walsh et&#xa0;al., 2021</xref>). Similarly, kNN has a long history in classification and pattern recognition (e.g., <xref ref-type="bibr" rid="B34">Fix and Hodges, 1951</xref>; <xref ref-type="bibr" rid="B41">Hattori and Takahashi, 1999</xref>). In this study, we developed a kNN-based analog forecast system to predict regional SLA and demonstrated that this simple, computationally efficient approach can outperform traditional ocean forecast systems in many cases. Our results highlight the potential of analog forecasting as a complementary or alternative tool for mesoscale ocean prediction.</p>
<p>The kNN-based forecasting system may benefit end users whose decisions depend on mesoscale ocean features, such as eddies and boundary currents. This might include industries whose operations are sensitive to the location, strength, and evolution of eddies; to the location and intensity of fronts; and to the position and intensity of boundary currents. This includes industries such as fisheries, offshore energy, and shipping. Given its efficiency, adaptability and performance, analog forecasting represents a promising direction for future operational ocean forecasting.</p>
</sec>
</body>
<back>
<sec id="s8" sec-type="data-availability">
<title>Data availability statement</title>
<p>RADS satellite altimeter data are available at <uri xlink:href="http://rads.tudelft.nl">http://rads.tudelft.nl</uri>, with associated software at <uri xlink:href="https://github.com/remkos/rads">https://github.com/remkos/rads</uri> (last accessed on 26 March 2025). Data from ACCESS-OM2-01 are available from <uri xlink:href="https://doi.org/10.4225/41/5a2dc8543105a">https://doi.org/10.4225/41/5a2dc8543105a</uri> (last accessed on 26 January 2025). Data from OFAM runs are available from <uri xlink:href="https://thredds.nci.org.au/thredds/catalog/gb6/OFAM3/OFAM3_EI_SPINUP/catalog.html">https://thredds.nci.org.au/thredds/catalog/gb6/OFAM3/OFAM3_EI_SPINUP/catalog.html</uri> and <uri xlink:href="https://dapds00.nci.org.au/thredds/catalog/gb6/OFAM3/OFAM3_BGC_2021/OUTPUT/catalog.html">https://dapds00.nci.org.au/thredds/catalog/gb6/OFAM3/OFAM3_BGC_2021/OUTPUT/catalog.html</uri> (last accessed on 28 January 2025). Data from the LICOM3 run are available at the Science Data Bank at <uri xlink:href="https://doi.org/10.11922/sciencedb.j00076.00095">https://doi.org/10.11922/sciencedb.j00076.00095</uri> (last accessed on 17 January 2025). OFES data are accessed from <uri xlink:href="https://apdrc.soest.hawaii.edu/datadoc/ofes/clim_0.1_global_1day.php">https://apdrc.soest.hawaii.edu/datadoc/ofes/clim_0.1_global_1day.php</uri> (last accessed on 26 February 2025). OceanMAPS analyses and forecasts were accessed from the Australian Bureau of Meteorology at <uri xlink:href="ftp://ftp-reg.cloud.bom.gov.au/register/username/nwp">ftp://ftp-reg.cloud.bom.gov.au/register/username/nwp</uri> at the time of each forecast and archived at CSIRO (last accessed on 19 February 2025). Analyses from IMOS OceanCurrent are available from <uri xlink:href="http://imos.aodn.org.au/oceancurrent">http://imos.aodn.org.au/oceancurrent</uri> (last accessed on 26 March 2025). 
The Ssalto/Duacs altimeter products were produced and distributed by the Copernicus Marine Environment Monitoring Service (CMEMS) <uri xlink:href="https://marine.copernicus.eu/">https://marine.copernicus.eu/</uri> (last accessed on 2 April 2025).</p></sec>
<sec id="s9" sec-type="author-contributions">
<title>Author contributions</title>
<p>PO: Conceptualization, Formal analysis, Methodology, Software, Validation, Visualization, Writing &#x2013; original draft, Writing &#x2013; review &amp; editing. TR: Conceptualization, Formal analysis, Methodology, Writing &#x2013; review &amp; editing.</p></sec>
<ack>
<title>Acknowledgments</title>
<p>The authors offer sincere thanks to M. Chamberlain and A. Kiss for helping us identify and access model runs produced under Bluelink (<ext-link ext-link-type="uri" xlink:href="https://research.csiro.au/bluelink/">https://research.csiro.au/bluelink/</ext-link>) and COSIMA (<ext-link ext-link-type="uri" xlink:href="https://cosima.org.au">https://cosima.org.au</ext-link>), respectively; and to H. Sasaki for helping us access OFES data (<ext-link ext-link-type="uri" xlink:href="https://www.jamstec.go.jp/ofes/">https://www.jamstec.go.jp/ofes/</ext-link>). The authors also gratefully acknowledge R. Woodham and M. Chamberlain for comments that led to improvements in this study.</p>
</ack>
<sec id="s11" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p></sec>
<sec id="s12" sec-type="ai-statement">
<title>Generative AI statement</title>
<p>The author(s) declare that no Generative AI was used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p></sec>
<sec id="s13" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p></sec>
<sec id="s14" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fmars.2025.1729116/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fmars.2025.1729116/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="DataSheet1.pdf" id="SM1" mimetype="application/pdf"/></sec>
<ref-list>
<title>References</title>
<ref id="B1">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Acosta Navarro</surname> <given-names>J. C.</given-names></name>
<name><surname>Aranyossy</surname> <given-names>A.</given-names></name>
<name><surname>De Luca</surname> <given-names>P.</given-names></name>
<name><surname>Donat</surname> <given-names>M. G.</given-names></name>
<name><surname>Hrast Essenfelder</surname> <given-names>A.</given-names></name>
<name><surname>Mahmood</surname> <given-names>R.</given-names></name>
<etal/>
</person-group>. (<year>2025</year>). 
<article-title>Seamless seasonal to multi-annual predictions of temperature and standardized precipitation index by constraining transient climate model simulations</article-title>. <source>EGUsphere</source> <volume>2025</volume>, <fpage>1</fpage>&#x2013;<lpage>24</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.5194/esd-16-1723-2025</pub-id>
</mixed-citation>
</ref>
<ref id="B2">
<mixed-citation publication-type="book">
<person-group person-group-type="author">
<name><surname>Adcroft</surname> <given-names>A.</given-names></name>
<name><surname>Hill</surname> <given-names>C.</given-names></name>
<name><surname>Campin</surname> <given-names>J.-M.</given-names></name>
<name><surname>Marshall</surname> <given-names>J.</given-names></name>
<name><surname>Heimbach</surname> <given-names>P.</given-names></name>
</person-group> (<year>2004</year>). &#x201c;
<article-title>Overview of the formulation and numerics of the MIT GCM</article-title>,&#x201d; in <source>Proceedings of the ECMWF seminar series on Numerical Methods, <italic>Recent developments in numerical methods for atmosphere and ocean modelling</italic></source> (<publisher-loc>Shinfield Park, Reading, UK</publisher-loc>: 
<publisher-name>ECMWF</publisher-name>), <fpage>139</fpage>&#x2013;<lpage>149</lpage>.
</mixed-citation>
</ref>
<ref id="B3">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Aijaz</surname> <given-names>S.</given-names></name>
<name><surname>Brassington</surname> <given-names>G. B.</given-names></name>
<name><surname>Divakaran</surname> <given-names>P.</given-names></name>
<name><surname>R&#xe9;gnier</surname> <given-names>C.</given-names></name>
<name><surname>Dr&#xe9;villon</surname> <given-names>M.</given-names></name>
<name><surname>Maksymczuk</surname> <given-names>J.</given-names></name>
<etal/>
</person-group>. (<year>2023</year>). 
<article-title>Verification and intercomparison of global ocean Eulerian near-surface currents</article-title>. <source>Ocean. Model.</source> <volume>186</volume>, <fpage>102241</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.ocemod.2023.102241</pub-id>
</mixed-citation>
</ref>
<ref id="B4">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Arango</surname> <given-names>H. G.</given-names></name>
<name><surname>Levin</surname> <given-names>J.</given-names></name>
<name><surname>Wilkin</surname> <given-names>J.</given-names></name>
<name><surname>Moore</surname> <given-names>A. M.</given-names></name>
</person-group> (<year>2023</year>). 
<article-title>4D-Var data assimilation in a nested model of the Mid-Atlantic Bight</article-title>. <source>Ocean. Model.</source> <volume>184</volume>, <fpage>102201</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.ocemod.2023.102201</pub-id>
</mixed-citation>
</ref>
<ref id="B5">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Bagtasa</surname> <given-names>G.</given-names></name>
</person-group> (<year>2021</year>). 
<article-title>Analog forecasting of tropical cyclone rainfall in the Philippines</article-title>. <source>Weather. Climate Extremes.</source> <volume>32</volume>, <fpage>100323</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.wace.2021.100323</pub-id>
</mixed-citation>
</ref>
<ref id="B6">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Ballarotta</surname> <given-names>M.</given-names></name>
<name><surname>Ubelmann</surname> <given-names>C.</given-names></name>
<name><surname>Bellemin-Laponnaz</surname> <given-names>V.</given-names></name>
<name><surname>Le Guillou</surname> <given-names>F.</given-names></name>
<name><surname>Meda</surname> <given-names>G.</given-names></name>
<name><surname>Anadon</surname> <given-names>C.</given-names></name>
<etal/>
</person-group>. (<year>2025</year>). 
<article-title>Integrating wide-swath altimetry data into Level-4 multi-mission maps</article-title>. <source>Ocean. Sci.</source> <volume>21</volume>, <fpage>63</fpage>&#x2013;<lpage>80</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.5194/os-21-63-2025</pub-id>
</mixed-citation>
</ref>
<ref id="B7">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Balmaseda</surname> <given-names>M. A.</given-names></name>
<name><surname>Alves</surname> <given-names>O. J.</given-names></name>
<name><surname>Arribas</surname> <given-names>A.</given-names></name>
<name><surname>Awaji</surname> <given-names>T.</given-names></name>
<name><surname>Behringer</surname> <given-names>D. W.</given-names></name>
<name><surname>Ferry</surname> <given-names>N.</given-names></name>
<etal/>
</person-group>. (<year>2009</year>). 
<article-title>Ocean initialization for seasonal forecasts</article-title>. <source>Oceanography</source> <volume>22</volume>, <fpage>154</fpage>&#x2013;<lpage>159</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.5670/oceanog.2009.73</pub-id>
</mixed-citation>
</ref>
<ref id="B8">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Balmaseda</surname> <given-names>M. A.</given-names></name>
<name><surname>Dee</surname> <given-names>D.</given-names></name>
<name><surname>Vidard</surname> <given-names>A.</given-names></name>
<name><surname>Anderson</surname> <given-names>D. L.</given-names></name>
</person-group> (<year>2007</year>). 
<article-title>A multivariate treatment of bias for sequential data assimilation: Application to the tropical oceans</article-title>. <source>Q. J. R. Meteorol. Soc.</source> <volume>133</volume>, <fpage>167</fpage>&#x2013;<lpage>179</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/qj.12</pub-id>
</mixed-citation>
</ref>
<ref id="B9">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Bannayan</surname> <given-names>M.</given-names></name>
<name><surname>Hoogenboom</surname> <given-names>G.</given-names></name>
</person-group> (<year>2008</year>). 
<article-title>Weather analogue: a tool for real-time prediction of daily weather data realizations based on a modified k-nearest neighbor approach</article-title>. <source>Environ. Model. Softw.</source> <volume>23</volume>, <fpage>703</fpage>&#x2013;<lpage>713</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.envsoft.2007.09.011</pub-id>
</mixed-citation>
</ref>
<ref id="B10">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Bergen</surname> <given-names>R. E.</given-names></name>
<name><surname>Harnack</surname> <given-names>R. P.</given-names></name>
</person-group> (<year>1982</year>). 
<article-title>Long-range temperature prediction using a simple analog approach</article-title>. <source>Monthly. Weather. Rev.</source> <volume>110</volume>, <fpage>1083</fpage>&#x2013;<lpage>1099</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1175/1520-0493(1982)110&lt;1083:LRTPUA&gt;2.0.CO;2</pub-id>
</mixed-citation>
</ref>
<ref id="B11">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Bloom</surname> <given-names>S.</given-names></name>
<name><surname>Takacs</surname> <given-names>L.</given-names></name>
<name><surname>da Silva</surname> <given-names>A.</given-names></name>
<name><surname>Ledvina</surname> <given-names>D.</given-names></name>
</person-group> (<year>1996</year>). 
<article-title>Data assimilation using incremental analysis updates</article-title>. <source>Monthly. Weather. Rev.</source> <volume>124</volume>, <fpage>1256</fpage>&#x2013;<lpage>1271</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1175/1520-0493(1996)124&lt;1256:DAUIAU&gt;2.0.CO;2</pub-id>
</mixed-citation>
</ref>
<ref id="B12">
<mixed-citation publication-type="book">
<person-group person-group-type="author">
<name><surname>Brassington</surname> <given-names>G. B.</given-names></name>
<name><surname>Sakov</surname> <given-names>P.</given-names></name>
<name><surname>Divakaran</surname> <given-names>P.</given-names></name>
<name><surname>Aijaz</surname> <given-names>S.</given-names></name>
<name><surname>Sweeney-Van Kinderen</surname> <given-names>J.</given-names></name>
<name><surname>Huang</surname> <given-names>X.</given-names></name>
<etal/>
</person-group>. (<year>2023</year>). &#x201c;
<article-title>OceanMAPS v4.0i: a global eddy resolving EnKF ocean forecasting system</article-title>,&#x201d; in <source>OCEANS 2023-Limerick</source> (<publisher-loc>Piscataway, NJ, USA</publisher-loc>: 
<publisher-name>IEEE</publisher-name>), <fpage>1</fpage>&#x2013;<lpage>8</lpage>.
</mixed-citation>
</ref>
<ref id="B13">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Browne</surname> <given-names>R. H.</given-names></name>
</person-group> (<year>2010</year>). 
<article-title>The t-test p value and its relationship to the effect size and P(X&gt;Y)</article-title>. <source>Am. Statistician.</source> <volume>64</volume>, <fpage>30</fpage>&#x2013;<lpage>33</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1198/tast.2010.08261</pub-id>
</mixed-citation>
</ref>
<ref id="B14">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Bub</surname> <given-names>F. L.</given-names></name>
<name><surname>Mask</surname> <given-names>A. C.</given-names></name>
<name><surname>Wood</surname> <given-names>K. R.</given-names></name>
<name><surname>Krynen</surname> <given-names>D. G.</given-names></name>
<name><surname>Lunde</surname> <given-names>B. N.</given-names></name>
<name><surname>DeHaan</surname> <given-names>C. J.</given-names></name>
<etal/>
</person-group>. (<year>2014</year>). 
<article-title>The Navy&#x2019;s application of ocean forecasting to decision support</article-title>. <source>Oceanography</source> <volume>27</volume>, <fpage>126</fpage>&#x2013;<lpage>137</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.5670/oceanog.2014.74</pub-id>
</mixed-citation>
</ref>
<ref id="B15">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Burgers</surname> <given-names>G.</given-names></name>
<name><surname>Balmaseda</surname> <given-names>M. A.</given-names></name>
<name><surname>Vossepoel</surname> <given-names>F.</given-names></name>
<name><surname>van Oldenborgh</surname> <given-names>G.</given-names></name>
<name><surname>van Leeuwen</surname> <given-names>P. J.</given-names></name>
</person-group> (<year>2002</year>). 
<article-title>Balanced ocean-data assimilation near the equator</article-title>. <source>J. Phys. Oceanogr.</source> <volume>32</volume>, <fpage>2509</fpage>&#x2013;<lpage>2519</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1175/1520-0485-32.9.2509</pub-id>
</mixed-citation>
</ref>
<ref id="B16">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Chamberlain</surname> <given-names>M.</given-names></name>
<name><surname>Oke</surname> <given-names>P.</given-names></name>
<name><surname>Brassington</surname> <given-names>G.</given-names></name>
<name><surname>Sandery</surname> <given-names>P.</given-names></name>
<name><surname>Divakaran</surname> <given-names>P.</given-names></name>
<name><surname>Fiedler</surname> <given-names>R.</given-names></name>
</person-group> (<year>2021</year>a). 
<article-title>Multiscale data assimilation in the Bluelink ocean reanalysis (BRAN)</article-title>. <source>Ocean. Model.</source> <volume>166</volume>, <fpage>101849</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.ocemod.2021.101849</pub-id>
</mixed-citation>
</ref>
<ref id="B17">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Chamberlain</surname> <given-names>M. A.</given-names></name>
<name><surname>Oke</surname> <given-names>P. R.</given-names></name>
<name><surname>Fiedler</surname> <given-names>R. A.</given-names></name>
<name><surname>Beggs</surname> <given-names>H. M.</given-names></name>
<name><surname>Brassington</surname> <given-names>G. B.</given-names></name>
<name><surname>Divakaran</surname> <given-names>P.</given-names></name>
</person-group> (<year>2021</year>b). 
<article-title>Next generation of Bluelink ocean reanalysis with multiscale data assimilation: BRAN2020</article-title>. <source>Earth Syst. Sci. Data</source> <volume>13</volume>, <fpage>5663</fpage>&#x2013;<lpage>5688</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.5194/essd-13-5663-2021</pub-id>
</mixed-citation>
</ref>
<ref id="B18">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Chassignet</surname> <given-names>E. P.</given-names></name>
<name><surname>Hurlburt</surname> <given-names>H. E.</given-names></name>
<name><surname>Smedstad</surname> <given-names>O. M.</given-names></name>
<name><surname>Halliwell</surname> <given-names>G. R.</given-names></name>
<name><surname>Hogan</surname> <given-names>P. J.</given-names></name>
<name><surname>Wallcraft</surname> <given-names>A. J.</given-names></name>
<etal/>
</person-group>. (<year>2007</year>). 
<article-title>The HYCOM (hybrid coordinate ocean model) data assimilative system</article-title>. <source>J. Mar. Syst.</source> <volume>65</volume>, <fpage>60</fpage>&#x2013;<lpage>83</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.jmarsys.2005.09.016</pub-id>
</mixed-citation>
</ref>
<ref id="B19">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Christiansen</surname> <given-names>B.</given-names></name>
</person-group> (<year>2018</year>). 
<article-title>Ensemble averaging and the curse of dimensionality</article-title>. <source>J. Climate</source> <volume>31</volume>, <fpage>1587</fpage>&#x2013;<lpage>1596</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1175/JCLI-D-17-0197.1</pub-id>
</mixed-citation>
</ref>
<ref id="B20">
<mixed-citation publication-type="book">
<person-group person-group-type="author">
<name><surname>Ciliberti</surname> <given-names>S. A.</given-names></name>
<name><surname>Fanjul</surname> <given-names>E. A.</given-names></name>
<name><surname>Pearlman</surname> <given-names>J.</given-names></name>
<name><surname>Wilmer-Becker</surname> <given-names>K.</given-names></name>
<name><surname>Bahurel</surname> <given-names>P.</given-names></name>
<name><surname>Ardhuin</surname> <given-names>F.</given-names></name>
<etal/>
</person-group>. (<year>2023</year>). &#x201c;
<article-title>Evaluation of operational ocean forecasting systems from the perspective of the users and the experts</article-title>,&#x201d; in <source>7th edition of the Copernicus Ocean State Report (OSR7)</source>, State Planet <volume>1-osr7</volume>, <fpage>2</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.5194/sp-1-osr7-2-2023</pub-id>
</mixed-citation>
</ref>
<ref id="B21">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Counillon</surname> <given-names>F.</given-names></name>
<name><surname>Sakov</surname> <given-names>P.</given-names></name>
<name><surname>Bertino</surname> <given-names>L.</given-names></name>
</person-group> (<year>2009</year>). 
<article-title>Application of a hybrid EnKF-OI to ocean forecasting</article-title>. <source>Ocean. Sci.</source> <volume>5</volume>, <fpage>389</fpage>&#x2013;<lpage>401</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.5194/os-5-389-2009</pub-id>
</mixed-citation>
</ref>
<ref id="B22">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Cover</surname> <given-names>T.</given-names></name>
<name><surname>Hart</surname> <given-names>P.</given-names></name>
</person-group> (<year>1967</year>). 
<article-title>Nearest neighbor pattern classification</article-title>. <source>IEEE Trans. Inf. Theory</source> <volume>13</volume>, <fpage>21</fpage>&#x2013;<lpage>27</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1109/TIT.1967.1053964</pub-id>
</mixed-citation>
</ref>
<ref id="B23">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Daley</surname> <given-names>R.</given-names></name>
</person-group> (<year>1981</year>). 
<article-title>Normal mode initialization</article-title>. <source>Rev. Geophys.</source> <volume>19</volume>, <fpage>450</fpage>&#x2013;<lpage>468</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1029/RG019i003p00450</pub-id>
</mixed-citation>
</ref>
<ref id="B24">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Dee</surname> <given-names>D. P.</given-names></name>
<name><surname>Uppala</surname> <given-names>S.</given-names></name>
</person-group> (<year>2009</year>). 
<article-title>Variational bias correction of satellite radiance data in the ERA-Interim reanalysis</article-title>. <source>Q. J. R. Meteorol. Soc.</source> <volume>135</volume>, <fpage>1830</fpage>&#x2013;<lpage>1841</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/qj.493</pub-id>
</mixed-citation>
</ref>
<ref id="B25">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Delle Monache</surname> <given-names>L.</given-names></name>
<name><surname>Eckel</surname> <given-names>F. A.</given-names></name>
<name><surname>Rife</surname> <given-names>D. L.</given-names></name>
<name><surname>Nagarajan</surname> <given-names>B.</given-names></name>
<name><surname>Searight</surname> <given-names>K.</given-names></name>
</person-group> (<year>2013</year>). 
<article-title>Probabilistic weather prediction with an analog ensemble</article-title>. <source>Monthly. Weather. Rev.</source> <volume>141</volume>, <fpage>3498</fpage>&#x2013;<lpage>3516</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1175/MWR-D-12-00281.1</pub-id>
</mixed-citation>
</ref>
<ref id="B26">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Deng</surname> <given-names>Z.</given-names></name>
<name><surname>Zhu</surname> <given-names>X.</given-names></name>
<name><surname>Cheng</surname> <given-names>D.</given-names></name>
<name><surname>Zong</surname> <given-names>M.</given-names></name>
<name><surname>Zhang</surname> <given-names>S.</given-names></name>
</person-group> (<year>2016</year>). 
<article-title>Efficient kNN classification algorithm for big data</article-title>. <source>Neurocomputing</source> <volume>195</volume>, <fpage>143</fpage>&#x2013;<lpage>148</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.neucom.2015.08.112</pub-id>
</mixed-citation>
</ref>
<ref id="B27">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Dickson</surname> <given-names>T.</given-names></name>
<name><surname>Farr</surname> <given-names>H.</given-names></name>
<name><surname>Sear</surname> <given-names>D.</given-names></name>
<name><surname>Blake</surname> <given-names>J. I.</given-names></name>
</person-group> (<year>2019</year>). 
<article-title>Uncertainty in marine weather routing</article-title>. <source>Appl. Ocean. Res.</source> <volume>88</volume>, <fpage>138</fpage>&#x2013;<lpage>146</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.apor.2019.04.008</pub-id>
</mixed-citation>
</ref>
<ref id="B28">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Ding</surname> <given-names>M.</given-names></name>
<name><surname>Liu</surname> <given-names>H.</given-names></name>
<name><surname>Lin</surname> <given-names>P.</given-names></name>
<name><surname>Meng</surname> <given-names>Y.</given-names></name>
<name><surname>Zheng</surname> <given-names>W.</given-names></name>
<name><surname>An</surname> <given-names>B.</given-names></name>
<etal/>
</person-group>. (<year>2022</year>). 
<article-title>A century-long eddy-resolving simulation of global oceanic large- and mesoscale state</article-title>. <source>Sci. Data</source> <volume>9</volume>, <fpage>691</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41597-022-01766-9</pub-id>, PMID: <pub-id pub-id-type="pmid">36369203</pub-id>
</mixed-citation>
</ref>
<ref id="B29">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Ding</surname> <given-names>H.</given-names></name>
<name><surname>Newman</surname> <given-names>M.</given-names></name>
<name><surname>Alexander</surname> <given-names>M. A.</given-names></name>
<name><surname>Wittenberg</surname> <given-names>A. T.</given-names></name>
</person-group> (<year>2018</year>). 
<article-title>Skillful climate forecasts of the tropical Indo-Pacific ocean using model-analogs</article-title>. <source>J. Climate</source> <volume>31</volume>, <fpage>5437</fpage>&#x2013;<lpage>5459</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1175/JCLI-D-17-0661.1</pub-id>
</mixed-citation>
</ref>
<ref id="B30">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Ding</surname> <given-names>H.</given-names></name>
<name><surname>Newman</surname> <given-names>M.</given-names></name>
<name><surname>Alexander</surname> <given-names>M. A.</given-names></name>
<name><surname>Wittenberg</surname> <given-names>A. T.</given-names></name>
</person-group> (<year>2020</year>). 
<article-title>Relating CMIP5 model biases to seasonal forecast skill in the tropical Pacific</article-title>. <source>Geophys. Res. Lett.</source> <volume>47</volume>, <fpage>e2019GL086765</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1029/2019GL086765</pub-id>
</mixed-citation>
</ref>
<ref id="B31">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Eckel</surname> <given-names>F. A.</given-names></name>
<name><surname>Delle Monache</surname> <given-names>L.</given-names></name>
</person-group> (<year>2016</year>). 
<article-title>A hybrid NWP&#x2013;analog ensemble</article-title>. <source>Monthly. Weather. Rev.</source> <volume>144</volume>, <fpage>897</fpage>&#x2013;<lpage>911</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1175/MWR-D-15-0096.1</pub-id>
</mixed-citation>
</ref>
<ref id="B32">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Evensen</surname> <given-names>G.</given-names></name>
</person-group> (<year>2003</year>). 
<article-title>The ensemble Kalman filter: Theoretical formulation and practical implementation</article-title>. <source>Ocean. Dynamics.</source> <volume>53</volume>, <fpage>343</fpage>&#x2013;<lpage>367</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s10236-003-0036-9</pub-id>
</mixed-citation>
</ref>
<ref id="B33">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Ferry</surname> <given-names>N.</given-names></name>
<name><surname>Parent</surname> <given-names>L.</given-names></name>
<name><surname>Garric</surname> <given-names>G.</given-names></name>
<name><surname>Barnier</surname> <given-names>B.</given-names></name>
<name><surname>Jourdain</surname> <given-names>N. C.</given-names></name>
</person-group> (<year>2010</year>). 
<article-title>Mercator global eddy permitting ocean reanalysis GLORYS1V1: Description and results</article-title>. <source>Mercator-Ocean. Q. Newslett.</source> <volume>36</volume>, <fpage>15</fpage>&#x2013;<lpage>27</lpage>.
</mixed-citation>
</ref>
<ref id="B34">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Fix</surname> <given-names>E.</given-names></name>
<name><surname>Hodges</surname> <given-names>J. L.</given-names></name>
</person-group> (<year>1951</year>). 
<article-title>Discriminatory analysis, nonparametric discrimination</article-title>. <source>United States Air Force School of Aviation Medicine</source>, Report <volume>4</volume>, <month>February</month>.
</mixed-citation>
</ref>
<ref id="B35">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Green</surname> <given-names>D.</given-names></name>
<name><surname>Billy</surname> <given-names>J.</given-names></name>
<name><surname>Tapim</surname> <given-names>A.</given-names></name>
</person-group> (<year>2010</year>). 
<article-title>Indigenous Australians&#x2019; knowledge of weather and climate</article-title>. <source>Clim. Change</source> <volume>100</volume>, <fpage>337</fpage>&#x2013;<lpage>354</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s10584-010-9803-z</pub-id>
</mixed-citation>
</ref>
<ref id="B36">
<mixed-citation publication-type="book">
<person-group person-group-type="author">
<name><surname>Griffies</surname> <given-names>S. M.</given-names></name>
</person-group> (<year>2009</year>). <source>Elements of MOM4p1, GFDL Ocean Group Technical Report 6</source> (<publisher-loc>Princeton, NJ, USA</publisher-loc>: 
<publisher-name>NOAA/Geophysical Fluid Dynamics Laboratory</publisher-name>).
</mixed-citation>
</ref>
<ref id="B37">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Gul</surname> <given-names>N.</given-names></name>
<name><surname>Aamir</surname> <given-names>M.</given-names></name>
<name><surname>Aldahmani</surname> <given-names>S.</given-names></name>
<name><surname>Khan</surname> <given-names>Z.</given-names></name>
</person-group> (<year>2022</year>). 
<article-title>A weighted k-nearest neighbours ensemble with added accuracy and diversity</article-title>. <source>IEEE Access</source> <volume>10</volume>, <fpage>125920</fpage>&#x2013;<lpage>125929</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1109/ACCESS.2022.3225682</pub-id>
</mixed-citation>
</ref>
<ref id="B38">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Hall</surname> <given-names>T. J.</given-names></name>
<name><surname>Thessin</surname> <given-names>R. N.</given-names></name>
<name><surname>Bloy</surname> <given-names>G. J.</given-names></name>
<name><surname>Mutchler</surname> <given-names>C. N.</given-names></name>
</person-group> (<year>2010</year>). 
<article-title>Analog sky condition forecasting based on a k-nn algorithm</article-title>. <source>Weather. Forecast.</source> <volume>25</volume>, <fpage>1463</fpage>&#x2013;<lpage>1478</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1175/2010WAF2222372.1</pub-id>
</mixed-citation>
</ref>
<ref id="B39">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Hamill</surname> <given-names>T. M.</given-names></name>
</person-group> (<year>2001</year>). 
<article-title>Interpretation of rank histograms for verifying ensemble forecasts</article-title>. <source>Monthly. Weather. Rev.</source> <volume>129</volume>, <fpage>550</fpage>&#x2013;<lpage>560</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1175/1520-0493(2001)129&lt;0550:IORHFV&gt;2.0.CO;2</pub-id>
</mixed-citation>
</ref>
<ref id="B40">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Hamill</surname> <given-names>T. M.</given-names></name>
<name><surname>Whitaker</surname> <given-names>J. S.</given-names></name>
<name><surname>Mullen</surname> <given-names>S. L.</given-names></name>
</person-group> (<year>2006</year>). 
<article-title>Reforecasts: An important dataset for improving weather predictions</article-title>. <source>Bull. Am. Meteorol. Soc.</source> <volume>87</volume>, <fpage>33</fpage>&#x2013;<lpage>46</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1175/BAMS-87-1-33</pub-id>
</mixed-citation>
</ref>
<ref id="B41">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Hattori</surname> <given-names>K.</given-names></name>
<name><surname>Takahashi</surname> <given-names>M.</given-names></name>
</person-group> (<year>1999</year>). 
<article-title>A new nearest-neighbor rule in the pattern classification problem</article-title>. <source>Pattern Recognit.</source> <volume>32</volume>, <fpage>425</fpage>&#x2013;<lpage>432</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/S0031-3203(98)00097-1</pub-id>
</mixed-citation>
</ref>
<ref id="B42">
<mixed-citation publication-type="confproc">
<person-group person-group-type="author">
<name><surname>H&#xf6;llt</surname> <given-names>T.</given-names></name>
<name><surname>Magdy</surname> <given-names>A.</given-names></name>
<name><surname>Chen</surname> <given-names>G.</given-names></name>
<name><surname>Gopalakrishnan</surname> <given-names>G.</given-names></name>
<name><surname>Hoteit</surname> <given-names>I.</given-names></name>
<name><surname>Hansen</surname> <given-names>C. D.</given-names></name>
<etal/>
</person-group>. (<year>2013</year>). &#x201c;
<article-title>Visual analysis of uncertainties in ocean forecasts for planning and operation of off-shore structures</article-title>,&#x201d; in <conf-name>2013 IEEE Pacific Visualization Symposium (PacificVis)</conf-name>. <fpage>185</fpage>&#x2013;<lpage>192</lpage> (
<publisher-name>IEEE</publisher-name>). doi:&#xa0;<pub-id pub-id-type="doi">10.1109/PacificVis.2013.6596144</pub-id>
</mixed-citation>
</ref>
<ref id="B43">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Hou</surname> <given-names>Z.</given-names></name>
<name><surname>Li</surname> <given-names>J.</given-names></name>
<name><surname>Wang</surname> <given-names>L.</given-names></name>
<name><surname>Zhang</surname> <given-names>Y.</given-names></name>
<name><surname>Liu</surname> <given-names>T.</given-names></name>
</person-group> (<year>2022</year>). 
<article-title>Improving the forecast accuracy of ECMWF 2-m air temperature using a historical dataset</article-title>. <source>Atmosph. Res.</source> <volume>273</volume>, <fpage>106177</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.atmosres.2022.106177</pub-id>
</mixed-citation>
</ref>
<ref id="B44">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Hou</surname> <given-names>Z.</given-names></name>
<name><surname>Li</surname> <given-names>J.</given-names></name>
<name><surname>Zuo</surname> <given-names>B.</given-names></name>
</person-group> (<year>2021</year>). 
<article-title>Correction of monthly SST forecasts in CFSv2 using the local dynamical analog method</article-title>. <source>Weather. Forecast.</source> <volume>36</volume>, <fpage>843</fpage>&#x2013;<lpage>858</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1175/WAF-D-20-0123.1</pub-id>
</mixed-citation>
</ref>
<ref id="B45">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Houtekamer</surname> <given-names>P.</given-names></name>
<name><surname>Derome</surname> <given-names>J.</given-names></name>
</person-group> (<year>1995</year>). 
<article-title>Methods for ensemble prediction</article-title>. <source>Monthly. Weather. Rev.</source> <volume>123</volume>, <fpage>2181</fpage>&#x2013;<lpage>2196</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1175/1520-0493(1995)123&lt;2181:MFEP&gt;2.0.CO;2</pub-id>
</mixed-citation>
</ref>
<ref id="B46">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Imandoust</surname> <given-names>S. B.</given-names></name>
<name><surname>Bolandraftar</surname> <given-names>M.</given-names></name>
</person-group> (<year>2013</year>). 
<article-title>Application of k-Nearest Neighbor (kNN) approach for predicting economic events: Theoretical background</article-title>. <source>Int. J. Eng. Res. Appl.</source> <volume>3</volume>, <fpage>605</fpage>&#x2013;<lpage>610</lpage>.
</mixed-citation>
</ref>
<ref id="B47">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Junk</surname> <given-names>C.</given-names></name>
<name><surname>Delle Monache</surname> <given-names>L.</given-names></name>
<name><surname>Alessandrini</surname> <given-names>S.</given-names></name>
</person-group> (<year>2015</year>). 
<article-title>Analog-based ensemble model output statistics</article-title>. <source>Monthly. Weather. Rev.</source> <volume>143</volume>, <fpage>2909</fpage>&#x2013;<lpage>2917</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1175/MWR-D-15-0095.1</pub-id>
</mixed-citation>
</ref>
<ref id="B48">
<mixed-citation publication-type="book">
<person-group person-group-type="author">
<name><surname>Kalnay</surname> <given-names>E.</given-names></name>
<name><surname>Kanamitsu</surname> <given-names>M.</given-names></name>
<name><surname>Kistler</surname> <given-names>R.</given-names></name>
<name><surname>Collins</surname> <given-names>W.</given-names></name>
<name><surname>Deaven</surname> <given-names>D.</given-names></name>
<name><surname>Gandin</surname> <given-names>L.</given-names></name>
<etal/>
</person-group> (<year>2018</year>). 
<article-title>The NCEP/NCAR 40-year reanalysis project</article-title>. In <source>Renewable energy</source>. <publisher-loc>London UK</publisher-loc>: 
<publisher-name>Routledge</publisher-name> (Taylor &amp; Francis Group) <volume>1</volume>, <fpage>146</fpage>&#x2013;<lpage>194</lpage>.
</mixed-citation>
</ref>
<ref id="B49">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Kharin</surname> <given-names>V. V.</given-names></name>
<name><surname>Zwiers</surname> <given-names>F. W.</given-names></name>
<name><surname>Zhang</surname> <given-names>X.</given-names></name>
<name><surname>Wehner</surname> <given-names>M.</given-names></name>
</person-group> (<year>2013</year>). 
<article-title>Changes in temperature and precipitation extremes in the CMIP5 ensemble</article-title>. <source>Clim. Change</source> <volume>119</volume>, <fpage>345</fpage>&#x2013;<lpage>357</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s10584-013-0705-8</pub-id>
</mixed-citation>
</ref>
<ref id="B50">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Kiss</surname> <given-names>A. E.</given-names></name>
<name><surname>Hogg</surname> <given-names>A. M.</given-names></name>
<name><surname>Hannah</surname> <given-names>N.</given-names></name>
<name><surname>Boeira Dias</surname> <given-names>F.</given-names></name>
<name><surname>Brassington</surname> <given-names>G. B.</given-names></name>
<name><surname>Chamberlain</surname> <given-names>M. A.</given-names></name>
<etal/>
</person-group>. (<year>2020</year>). 
<article-title>ACCESS-OM2 v1.0: a global ocean&#x2013;sea ice model at three resolutions</article-title>. <source>Geosci. Model. Dev.</source> <volume>13</volume>, <fpage>401</fpage>&#x2013;<lpage>442</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.5194/gmd-13-401-2020</pub-id>
</mixed-citation>
</ref>
<ref id="B51">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Kleist</surname> <given-names>D. T.</given-names></name>
<name><surname>Parrish</surname> <given-names>D. F.</given-names></name>
<name><surname>Derber</surname> <given-names>J. C.</given-names></name>
<name><surname>Treadon</surname> <given-names>R.</given-names></name>
<name><surname>Errico</surname> <given-names>R. M.</given-names></name>
<name><surname>Yang</surname> <given-names>R.</given-names></name>
</person-group> (<year>2009</year>). 
<article-title>Improving incremental balance in the GSI 3DVAR analysis system</article-title>. <source>Monthly. Weather. Rev.</source> <volume>137</volume>, <fpage>1046</fpage>&#x2013;<lpage>1060</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1175/2008MWR2623.1</pub-id>
</mixed-citation>
</ref>
<ref id="B52">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Kobayashi</surname> <given-names>S.</given-names></name>
<name><surname>Ota</surname> <given-names>Y.</given-names></name>
<name><surname>Harada</surname> <given-names>Y.</given-names></name>
<name><surname>Ebita</surname> <given-names>A.</given-names></name>
<name><surname>Moriya</surname> <given-names>M.</given-names></name>
<name><surname>Onoda</surname> <given-names>H.</given-names></name>
<etal/>
</person-group>. (<year>2015</year>). 
<article-title>The JRA-55 reanalysis: General specifications and basic characteristics</article-title>. <source>J. Meteorol. Soc. Japan. Ser. II</source> <volume>93</volume>, <fpage>5</fpage>&#x2013;<lpage>48</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.2151/jmsj.2015-001</pub-id>
</mixed-citation>
</ref>
<ref id="B53">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Kourafalou</surname> <given-names>V.</given-names></name>
<name><surname>De Mey</surname> <given-names>P.</given-names></name>
<name><surname>Staneva</surname> <given-names>J.</given-names></name>
<name><surname>Ayoub</surname> <given-names>N.</given-names></name>
<name><surname>Barth</surname> <given-names>A.</given-names></name>
<name><surname>Chao</surname> <given-names>Y.</given-names></name>
<etal/>
</person-group>. (<year>2015</year>). 
<article-title>Coastal Ocean Forecasting: science foundation and user benefits</article-title>. <source>J. Operat. Oceanogr.</source> <volume>8</volume>, <fpage>s147</fpage>&#x2013;<lpage>s167</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/1755876X.2015.1022348</pub-id>
</mixed-citation>
</ref>
<ref id="B54">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Kumar</surname> <given-names>P. S.</given-names></name>
<name><surname>Pillai</surname> <given-names>G. N.</given-names></name>
<name><surname>Manjusha</surname> <given-names>U.</given-names></name>
</person-group> (<year>2014</year>). 
<article-title>El Nino southern oscillation (ENSO) impact on tuna fisheries in Indian Ocean</article-title>. <source>SpringerPlus</source> <volume>3</volume>, <fpage>1</fpage>&#x2013;<lpage>13</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/2193-1801-3-591</pub-id>, PMID: <pub-id pub-id-type="pmid">26034673</pub-id>
</mixed-citation>
</ref>
<ref id="B55">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Kuonen</surname> <given-names>J.</given-names></name>
<name><surname>Conway</surname> <given-names>F.</given-names></name>
<name><surname>Strub</surname> <given-names>T.</given-names></name>
</person-group> (<year>2019</year>). 
<article-title>Relating ocean condition forecasts to the process of end-user decision making: A case study of the Oregon commercial fishing community</article-title>. <source>Mar. Technol. Soc. J.</source> <volume>53</volume>, <fpage>53</fpage>&#x2013;<lpage>66</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.4031/MTSJ.53.1.1</pub-id>, PMID: <pub-id pub-id-type="pmid">33204041</pub-id>
</mixed-citation>
</ref>
<ref id="B56">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Langmack</surname> <given-names>H.</given-names></name>
<name><surname>Fraedrich</surname> <given-names>K.</given-names></name>
<name><surname>Sielmann</surname> <given-names>F.</given-names></name>
</person-group> (<year>2012</year>). 
<article-title>Tropical cyclone track analog ensemble forecasting in the extended Australian basin: NWP combinations</article-title>. <source>Q. J. R. Meteorol. Soc.</source> <volume>138</volume>, <fpage>1828</fpage>&#x2013;<lpage>1838</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/qj.1915</pub-id>
</mixed-citation>
</ref>
<ref id="B57">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Lorenz</surname> <given-names>E. N.</given-names></name>
</person-group> (<year>1969</year>). 
<article-title>Atmospheric predictability as revealed by naturally occurring analogues</article-title>. <source>J. Atmosph. Sci.</source> <volume>26</volume>, <fpage>636</fpage>&#x2013;<lpage>646</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1175/1520-0469(1969)26&lt;636:APARBN&gt;2.0.CO;2</pub-id>
</mixed-citation>
</ref>
<ref id="B58">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Lubchenco</surname> <given-names>J.</given-names></name>
<name><surname>McNutt</surname> <given-names>M. K.</given-names></name>
<name><surname>Dreyfus</surname> <given-names>G.</given-names></name>
<name><surname>Murawski</surname> <given-names>S. A.</given-names></name>
<name><surname>Kennedy</surname> <given-names>D. M.</given-names></name>
<name><surname>Anastas</surname> <given-names>P. T.</given-names></name>
<etal/>
</person-group>. (<year>2012</year>). 
<article-title>Science in support of the Deepwater Horizon response</article-title>. <source>Proc. Natl. Acad. Sci.</source> <volume>109</volume>, <fpage>20212</fpage>&#x2013;<lpage>20221</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.1204729109</pub-id>, PMID: <pub-id pub-id-type="pmid">23213250</pub-id>
</mixed-citation>
</ref>
<ref id="B59">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Lynch</surname> <given-names>P.</given-names></name>
<name><surname>Huang</surname> <given-names>X.-Y.</given-names></name>
</person-group> (<year>1992</year>). 
<article-title>Initialization of the HIRLAM model using a digital filter</article-title>. <source>Monthly. Weather. Rev.</source> <volume>120</volume>, <fpage>1019</fpage>&#x2013;<lpage>1034</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1175/1520-0493(1992)120&lt;1019:IOTHMU&gt;2.0.CO;2</pub-id>
</mixed-citation>
</ref>
<ref id="B60">
<mixed-citation publication-type="book">
<person-group person-group-type="author">
<name><surname>Madec</surname> <given-names>G.</given-names></name>
</person-group> (<year>2016</year>). &#x201c;
<article-title>NEMO ocean engine</article-title>,&#x201d; in <source>Scientific notes of climate modelling center</source>. <publisher-loc>Paris, France</publisher-loc>: 
<publisher-name>Institut Pierre&#x2011;Simon Laplace (IPSL)</publisher-name> <volume>27</volume>, <fpage>1288</fpage>.
</mixed-citation>
</ref>
<ref id="B61">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Malanotte-Rizzoli</surname> <given-names>P.</given-names></name>
<name><surname>Young</surname> <given-names>R. E.</given-names></name>
<name><surname>Haidvogel</surname> <given-names>D. B.</given-names></name>
</person-group> (<year>1989</year>). 
<article-title>Initialization and data assimilation experiments with a primitive equation model</article-title>. <source>Dynamics. Atmospheres. Oceans.</source> <volume>13</volume>, <fpage>349</fpage>&#x2013;<lpage>378</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/0377-0265(89)90046-8</pub-id>
</mixed-citation>
</ref>
<ref id="B62">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Martin</surname> <given-names>M.</given-names></name>
<name><surname>Bell</surname> <given-names>M.</given-names></name>
<name><surname>Nichols</surname> <given-names>N. K.</given-names></name>
</person-group> (<year>2002</year>). 
<article-title>Estimation of systematic error in an equatorial ocean model using data assimilation</article-title>. <source>Int. J. Numerical. Methods Fluids.</source> <volume>40</volume>, <fpage>435</fpage>&#x2013;<lpage>444</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/fld.298</pub-id>
</mixed-citation>
</ref>
<ref id="B63">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Masumoto</surname> <given-names>Y.</given-names></name>
<name><surname>Sasaki</surname> <given-names>H.</given-names></name>
<name><surname>Kagimoto</surname> <given-names>T.</given-names></name>
<name><surname>Komori</surname> <given-names>N.</given-names></name>
<name><surname>Ishida</surname> <given-names>A.</given-names></name>
<name><surname>Sasai</surname> <given-names>Y.</given-names></name>
<etal/>
</person-group>. (<year>2004</year>). 
<article-title>A fifty-year eddy-resolving simulation of the world ocean: Preliminary outcomes of OFES (OGCM for the Earth Simulator)</article-title>. <source>J. Earth Simulator.</source> <volume>1</volume>, <fpage>35</fpage>&#x2013;<lpage>56</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.32131/jes.1.35</pub-id>
</mixed-citation>
</ref>
<ref id="B64">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Middleton</surname> <given-names>J. F.</given-names></name>
<name><surname>Bye</surname> <given-names>J. A.</given-names></name>
</person-group> (<year>2007</year>). 
<article-title>A review of the shelf-slope circulation along Australia&#x2019;s southern shelves: Cape Leeuwin to Portland</article-title>. <source>Prog. Oceanogr.</source> <volume>75</volume>, <fpage>1</fpage>&#x2013;<lpage>41</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.pocean.2007.07.001</pub-id>
</mixed-citation>
</ref>
<ref id="B65">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Mirouze</surname> <given-names>I.</given-names></name>
<name><surname>R&#xe9;my</surname> <given-names>E.</given-names></name>
<name><surname>Lellouche</surname> <given-names>J.-M.</given-names></name>
<name><surname>Martin</surname> <given-names>M. J.</given-names></name>
<name><surname>Donlon</surname> <given-names>C. J.</given-names></name>
</person-group> (<year>2024</year>). 
<article-title>Impact of assimilating satellite surface velocity observations in the Mercator Ocean International analysis and forecasting global 1/4&#xb0; system</article-title>. <source>Front. Mar. Sci.</source> <volume>11</volume>, <elocation-id>1376999</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fmars.2024.1376999</pub-id>
</mixed-citation>
</ref>
<ref id="B66">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Mitchell</surname> <given-names>H. L.</given-names></name>
<name><surname>Houtekamer</surname> <given-names>P. L.</given-names></name>
<name><surname>Pellerin</surname> <given-names>G.</given-names></name>
</person-group> (<year>2002</year>). 
<article-title>Ensemble size, balance, and model-error representation in an ensemble Kalman filter</article-title>. <source>Monthly. Weather. Rev.</source> <volume>130</volume>, <fpage>2791</fpage>&#x2013;<lpage>2808</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1175/1520-0493(2002)130&lt;2791:ESBAME&gt;2.0.CO;2</pub-id>
</mixed-citation>
</ref>
<ref id="B67">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Murphy</surname> <given-names>A. H.</given-names></name>
</person-group> (<year>1996</year>). 
<article-title>General decompositions of MSE-based skill scores: Measures of some basic aspects of forecast quality</article-title>. <source>Monthly. Weather. Rev.</source> <volume>124</volume>, <fpage>2353</fpage>&#x2013;<lpage>2369</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1175/1520-0493(1996)124&lt;2353:GDOMBS&gt;2.0.CO;2</pub-id>
</mixed-citation>
</ref>
<ref id="B68">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Nagarajan</surname> <given-names>B.</given-names></name>
<name><surname>Delle Monache</surname> <given-names>L.</given-names></name>
<name><surname>Hacker</surname> <given-names>J. P.</given-names></name>
<name><surname>Rife</surname> <given-names>D. L.</given-names></name>
<name><surname>Searight</surname> <given-names>K.</given-names></name>
<name><surname>Knievel</surname> <given-names>J. C.</given-names></name>
<etal/>
</person-group>. (<year>2015</year>). 
<article-title>An evaluation of analog-based postprocessing methods across several variables and forecast models</article-title>. <source>Weather. Forecast.</source> <volume>30</volume>, <fpage>1623</fpage>&#x2013;<lpage>1643</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1175/WAF-D-14-00081.1</pub-id>
</mixed-citation>
</ref>
<ref id="B69">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>O&#x2019;Kane</surname> <given-names>T. J.</given-names></name>
<name><surname>Oke</surname> <given-names>P. R.</given-names></name>
<name><surname>Sandery</surname> <given-names>P. A.</given-names></name>
</person-group> (<year>2011</year>). 
<article-title>Predicting the East Australian current</article-title>. <source>Ocean. Model.</source> <volume>38</volume>, <fpage>251</fpage>&#x2013;<lpage>266</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.ocemod.2011.04.003</pub-id>
</mixed-citation>
</ref>
<ref id="B70">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Oke</surname> <given-names>P. R.</given-names></name>
<name><surname>Allen</surname> <given-names>J.</given-names></name>
<name><surname>Miller</surname> <given-names>R.</given-names></name>
<name><surname>Egbert</surname> <given-names>G.</given-names></name>
<name><surname>Austin</surname> <given-names>J.</given-names></name>
<name><surname>Barth</surname> <given-names>J.</given-names></name>
<etal/>
</person-group>. (<year>2002</year>a). 
<article-title>A modeling study of the three-dimensional continental shelf circulation off Oregon. Part I: Model&#x2013;data comparisons</article-title>. <source>J. Phys. Oceanogr.</source> <volume>32</volume>, <fpage>1360</fpage>&#x2013;<lpage>1382</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1175/1520-0485(2002)032&lt;1360:AMSOTT&gt;2.0.CO;2</pub-id>
</mixed-citation>
</ref>
<ref id="B71">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Oke</surname> <given-names>P. R.</given-names></name>
<name><surname>Allen</surname> <given-names>J. S.</given-names></name>
<name><surname>Miller</surname> <given-names>R. N.</given-names></name>
<name><surname>Egbert</surname> <given-names>G. D.</given-names></name>
<name><surname>Kosro</surname> <given-names>P. M.</given-names></name>
</person-group> (<year>2002</year>b). 
<article-title>Assimilation of surface velocity data into a primitive equation coastal ocean model</article-title>. <source>J. Geophys. Res.: Oceans.</source> <volume>107</volume>, <fpage>5-1</fpage>&#x2013;<lpage>5-25</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1029/2000JC000511</pub-id>
</mixed-citation>
</ref>
<ref id="B72">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Oke</surname> <given-names>P. R.</given-names></name>
<name><surname>Brassington</surname> <given-names>G. B.</given-names></name>
<name><surname>Griffin</surname> <given-names>D. A.</given-names></name>
<name><surname>Schiller</surname> <given-names>A.</given-names></name>
</person-group> (<year>2008</year>). 
<article-title>The Bluelink ocean data assimilation system (BODAS)</article-title>. <source>Ocean. Model.</source> <volume>21</volume>, <fpage>46</fpage>&#x2013;<lpage>70</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.ocemod.2007.11.002</pub-id>
</mixed-citation>
</ref>
<ref id="B73">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Oke</surname> <given-names>P. R.</given-names></name>
<name><surname>Brassington</surname> <given-names>G. B.</given-names></name>
<name><surname>Griffin</surname> <given-names>D. A.</given-names></name>
<name><surname>Schiller</surname> <given-names>A.</given-names></name>
</person-group> (<year>2010</year>). 
<article-title>Ocean data assimilation: a case for ensemble optimal interpolation</article-title>. <source>Aust. Meteorol. Oceanogr. J.</source> <volume>59</volume>, <fpage>67</fpage>&#x2013;<lpage>76</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.22499/2.5901.008</pub-id>
</mixed-citation>
</ref>
<ref id="B74">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Oke</surname> <given-names>P. R.</given-names></name>
<name><surname>Chamberlain</surname> <given-names>M. A.</given-names></name>
<name><surname>Fiedler</surname> <given-names>R. A.</given-names></name>
<name><surname>Bastos de Oliveira</surname> <given-names>H.</given-names></name>
<name><surname>Beggs</surname> <given-names>H. M.</given-names></name>
<name><surname>Brassington</surname> <given-names>G. B.</given-names></name>
</person-group> (<year>2021</year>). 
<article-title>Combining Argo and satellite data using model-derived covariances: Blue Maps</article-title>. <source>Front. Earth Sci.</source> <volume>9</volume>, <elocation-id>696985</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/feart.2021.696985</pub-id>
</mixed-citation>
</ref>
<ref id="B75">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Oke</surname> <given-names>P. R.</given-names></name>
<name><surname>Griffin</surname> <given-names>D. A.</given-names></name>
<name><surname>Schiller</surname> <given-names>A.</given-names></name>
<name><surname>Matear</surname> <given-names>R.</given-names></name>
<name><surname>Fiedler</surname> <given-names>R.</given-names></name>
<name><surname>Mansbridge</surname> <given-names>J.</given-names></name>
<etal/>
</person-group>. (<year>2013</year>). 
<article-title>Evaluation of a near-global eddy-resolving ocean model</article-title>. <source>Geosci. Model. Dev.</source> <volume>6</volume>, <fpage>591</fpage>&#x2013;<lpage>615</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.5194/gmd-6-591-2013</pub-id>
</mixed-citation>
</ref>
<ref id="B76">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Oke</surname> <given-names>P. R.</given-names></name>
<name><surname>Sakov</surname> <given-names>P.</given-names></name>
<name><surname>Corney</surname> <given-names>S. P.</given-names></name>
</person-group> (<year>2007</year>). 
<article-title>Impacts of localisation in the EnKF and EnOI: experiments with a small model</article-title>. <source>Ocean. Dynamics.</source> <volume>57</volume>, <fpage>32</fpage>&#x2013;<lpage>45</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s10236-006-0088-8</pub-id>
</mixed-citation>
</ref>
<ref id="B77">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Peng</surname> <given-names>Y.</given-names></name>
<name><surname>Liu</surname> <given-names>X.</given-names></name>
<name><surname>Su</surname> <given-names>J.</given-names></name>
<name><surname>Liu</surname> <given-names>X.</given-names></name>
<name><surname>Zhang</surname> <given-names>Y.</given-names></name>
</person-group> (<year>2023</year>). 
<article-title>Skill improvement of the yearly updated reforecasts in ECMWF S2S prediction from 2016 to 2022</article-title>. <source>Atmosph. Oceanic. Sci. Lett.</source> <volume>16</volume>, <fpage>100357</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.aosl.2023.100357</pub-id>
</mixed-citation>
</ref>
<ref id="B78">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Pestov</surname> <given-names>V.</given-names></name>
</person-group> (<year>2013</year>). 
<article-title>Is the k-NN classifier in high dimensions affected by the curse of dimensionality?</article-title> <source>Comput. Math. Appl.</source> <volume>65</volume>, <fpage>1427</fpage>&#x2013;<lpage>1437</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.camwa.2012.09.011</pub-id>
</mixed-citation>
</ref>
<ref id="B79">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Pilo</surname> <given-names>G. S.</given-names></name>
<name><surname>Oke</surname> <given-names>P. R.</given-names></name>
<name><surname>Coleman</surname> <given-names>R.</given-names></name>
<name><surname>Rykova</surname> <given-names>T.</given-names></name>
<name><surname>Ridgway</surname> <given-names>K.</given-names></name>
</person-group> (<year>2018</year>). 
<article-title>Impact of data assimilation on vertical velocities in an eddy resolving ocean model</article-title>. <source>Ocean. Model.</source> <volume>131</volume>, <fpage>71</fpage>&#x2013;<lpage>85</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.ocemod.2018.09.003</pub-id>
</mixed-citation>
</ref>
<ref id="B80">
<mixed-citation publication-type="book">
<person-group person-group-type="author">
<name><surname>Platzer</surname> <given-names>P.</given-names></name>
<name><surname>Chapron</surname> <given-names>B.</given-names></name>
</person-group> (<year>2024</year>). &#x201c;
<article-title>Analogue forecasting ensembles</article-title>,&#x201d; in <source>Stochastic Transport in Upper Ocean Dynamics III: STUOD 2023 Workshop</source> (<publisher-loc>Cham, Switzerland</publisher-loc>: 
<publisher-name>Springer Nature</publisher-name>), <fpage>223</fpage>.
</mixed-citation>
</ref>
<ref id="B81">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Poli</surname> <given-names>P.</given-names></name>
<name><surname>Hersbach</surname> <given-names>H.</given-names></name>
<name><surname>Dee</surname> <given-names>D. P.</given-names></name>
<name><surname>Berrisford</surname> <given-names>P.</given-names></name>
<name><surname>Simmons</surname> <given-names>A. J.</given-names></name>
<name><surname>Vitart</surname> <given-names>F.</given-names></name>
<etal/>
</person-group>. (<year>2016</year>). 
<article-title>ERA-20C: An atmospheric reanalysis of the twentieth century</article-title>. <source>J. Climate</source> <volume>29</volume>, <fpage>4083</fpage>&#x2013;<lpage>4097</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1175/JCLI-D-15-0556.1</pub-id>
</mixed-citation>
</ref>
<ref id="B82">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Raghukumar</surname> <given-names>K.</given-names></name>
<name><surname>Edwards</surname> <given-names>C. A.</given-names></name>
<name><surname>Goebel</surname> <given-names>N. L.</given-names></name>
<name><surname>Broquet</surname> <given-names>G.</given-names></name>
<name><surname>Veneziani</surname> <given-names>M.</given-names></name>
<name><surname>Moore</surname> <given-names>A. M.</given-names></name>
<etal/>
</person-group>. (<year>2015</year>). 
<article-title>Impact of assimilating physical oceanographic data on modeled ecosystem dynamics in the California Current System</article-title>. <source>Prog. Oceanogr.</source> <volume>138</volume>, <fpage>546</fpage>&#x2013;<lpage>558</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.pocean.2015.01.004</pub-id>
</mixed-citation>
</ref>
<ref id="B83">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Raja</surname> <given-names>K. J.</given-names></name>
<name><surname>Buijsman</surname> <given-names>M. C.</given-names></name>
<name><surname>Bozec</surname> <given-names>A.</given-names></name>
<name><surname>Helber</surname> <given-names>R. W.</given-names></name>
<name><surname>Shriver</surname> <given-names>J. F.</given-names></name>
<name><surname>Wallcraft</surname> <given-names>A.</given-names></name>
<etal/>
</person-group>. (<year>2024</year>). 
<article-title>Spurious internal wave generation during data assimilation in eddy resolving ocean model simulations</article-title>. <source>Ocean. Model.</source> <volume>188</volume>, <fpage>102340</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.ocemod.2024.102340</pub-id>
</mixed-citation>
</ref>
<ref id="B84">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Rautenbach</surname> <given-names>C.</given-names></name>
<name><surname>Blair</surname> <given-names>B.</given-names></name>
</person-group> (<year>2021</year>). 
<article-title>Marine meteorological forecasts for coastal ocean users&#x2013;perceptions, usability and uptake</article-title>. <source>Geosci. Commun.</source> <volume>4</volume>, <fpage>361</fpage>&#x2013;<lpage>381</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.5194/gc-4-361-2021</pub-id>
</mixed-citation>
</ref>
<ref id="B85">
<mixed-citation publication-type="confproc">
<person-group person-group-type="author">
<name><surname>Rosebrock</surname> <given-names>U.</given-names></name>
<name><surname>Oke</surname> <given-names>P. R.</given-names></name>
<name><surname>Carroll</surname> <given-names>G.</given-names></name>
</person-group> (<year>2015</year>). &#x201c;
<article-title>An application framework for the rapid deployment of ocean models in support of emergency services: Application to the MH370 search</article-title>,&#x201d; in <conf-name>Environmental Software Systems. Infrastructures, Services and Applications: 11th IFIP WG 5.11 International Symposium, ISESS 2015</conf-name>, <conf-loc>Melbourne, VIC, Australia</conf-loc>, <conf-date>March 25-27, 2015</conf-date>. Proceedings, IFIP Advances in Information and Communication Technology <volume>448</volume> (
<publisher-name>Springer</publisher-name>), <fpage>235</fpage>&#x2013;<lpage>241</lpage>.
</mixed-citation>
</ref>
<ref id="B86">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Ryan</surname> <given-names>A.</given-names></name>
<name><surname>Regnier</surname> <given-names>C.</given-names></name>
<name><surname>Divakaran</surname> <given-names>P.</given-names></name>
<name><surname>Spindler</surname> <given-names>T.</given-names></name>
<name><surname>Mehra</surname> <given-names>A.</given-names></name>
<name><surname>Smith</surname> <given-names>G.</given-names></name>
<etal/>
</person-group>. (<year>2015</year>). 
<article-title>GODAE OceanView Class 4 forecast verification framework: global ocean inter-comparison</article-title>. <source>J. Operat. Oceanogr.</source> <volume>8</volume>, <fpage>s98</fpage>&#x2013;<lpage>s111</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/1755876X.2015.1022330</pub-id>
</mixed-citation>
</ref>
<ref id="B87">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Rykova</surname> <given-names>T.</given-names></name>
</person-group> (<year>2023</year>). 
<article-title>Improving forecasts of individual ocean eddies using feature mapping</article-title>. <source>Sci. Rep.</source> <volume>13</volume>, <fpage>6216</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41598-023-33465-9</pub-id>, PMID: <pub-id pub-id-type="pmid">37069250</pub-id>
</mixed-citation>
</ref>
<ref id="B88">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Sakov</surname> <given-names>P.</given-names></name>
<name><surname>Oke</surname> <given-names>P. R.</given-names></name>
</person-group> (<year>2008</year>). 
<article-title>A deterministic formulation of the ensemble Kalman filter: an alternative to ensemble square root filters</article-title>. <source>Tellus. A.: Dynamic. Meteorol. Oceanogr.</source> <volume>60</volume>, <fpage>361</fpage>&#x2013;<lpage>371</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/j.1600-0870.2007.00299.x</pub-id>
</mixed-citation>
</ref>
<ref id="B89">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Sakov</surname> <given-names>P.</given-names></name>
<name><surname>Sandery</surname> <given-names>P. A.</given-names></name>
</person-group> (<year>2015</year>). 
<article-title>Comparison of EnOI and EnKF regional ocean reanalysis systems</article-title>. <source>Ocean. Model.</source> <volume>89</volume>, <fpage>45</fpage>&#x2013;<lpage>60</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.ocemod.2015.02.003</pub-id>
</mixed-citation>
</ref>
<ref id="B90">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Sandery</surname> <given-names>P. A.</given-names></name>
<name><surname>Brassington</surname> <given-names>G. B.</given-names></name>
<name><surname>Freeman</surname> <given-names>J.</given-names></name>
</person-group> (<year>2011</year>). 
<article-title>Adaptive nonlinear dynamical initialization</article-title>. <source>J. Geophys. Res.: Oceans.</source> <volume>116</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.1029/2010JC006260</pub-id>
</mixed-citation>
</ref>
<ref id="B91">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Sasaki</surname> <given-names>H.</given-names></name>
<name><surname>Kida</surname> <given-names>S.</given-names></name>
<name><surname>Furue</surname> <given-names>R.</given-names></name>
<name><surname>Aiki</surname> <given-names>H.</given-names></name>
<name><surname>Komori</surname> <given-names>N.</given-names></name>
<name><surname>Masumoto</surname> <given-names>Y.</given-names></name>
<etal/>
</person-group>. (<year>2020</year>). 
<article-title>A global eddying hindcast ocean simulation with OFES2</article-title>. <source>Geosci. Model. Dev.</source> <volume>13</volume>, <fpage>3319</fpage>&#x2013;<lpage>3336</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.5194/gmd-13-3319-2020</pub-id>
</mixed-citation>
</ref>
<ref id="B92">
<mixed-citation publication-type="book">
<person-group person-group-type="author">
<name><surname>Scharroo</surname> <given-names>R.</given-names></name>
</person-group> (<year>2018</year>). <source>RADS data manual</source>. <publisher-loc>Netherlands</publisher-loc>: 
<publisher-name>TUDelft</publisher-name>.
</mixed-citation>
</ref>
<ref id="B93">
<mixed-citation publication-type="book">
<person-group person-group-type="author">
<name><surname>Scharroo</surname> <given-names>R.</given-names></name>
<name><surname>Leuliette</surname> <given-names>E.</given-names></name>
<name><surname>Lillibridge</surname> <given-names>J.</given-names></name>
<name><surname>Byrne</surname> <given-names>D.</given-names></name>
<name><surname>Naeije</surname> <given-names>M.</given-names></name>
<name><surname>Mitchum</surname> <given-names>G.</given-names></name>
</person-group> (<year>2013</year>). &#x201c;
<article-title>RADS: consistent multi-mission products</article-title>,&#x201d; in <source>20 Years of Progress in Radar Altimetry</source>, vol. <volume>710</volume>. Ed. 
<person-group person-group-type="editor">
<name><surname>Ouwehand</surname> <given-names>L.</given-names></name>
</person-group> (<publisher-loc>Noordwijk, The Netherlands</publisher-loc>: 
<publisher-name>ESA Special Publication</publisher-name>), <fpage>69</fpage>.
</mixed-citation>
</ref>
<ref id="B94">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Schiller</surname> <given-names>A.</given-names></name>
<name><surname>Brassington</surname> <given-names>G. B.</given-names></name>
<name><surname>Oke</surname> <given-names>P. R.</given-names></name>
<name><surname>Cahill</surname> <given-names>M.</given-names></name>
<name><surname>Divakaran</surname> <given-names>P.</given-names></name>
<name><surname>Entel</surname> <given-names>M.</given-names></name>
<etal/>
</person-group>. (<year>2020</year>). 
<article-title>Bluelink ocean forecasting Australia: 15 years of operational ocean service delivery with societal, economic and environmental benefits</article-title>. <source>J. Operat. Oceanogr.</source> <volume>13</volume>, <fpage>1</fpage>&#x2013;<lpage>18</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/1755876X.2019.1685834</pub-id>
</mixed-citation>
</ref>
<ref id="B95">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Siedlecki</surname> <given-names>S. A.</given-names></name>
<name><surname>Alin</surname> <given-names>S. R.</given-names></name>
<name><surname>Norton</surname> <given-names>E. L.</given-names></name>
<name><surname>Bond</surname> <given-names>N. A.</given-names></name>
<name><surname>Hermann</surname> <given-names>A. J.</given-names></name>
<name><surname>Feely</surname> <given-names>R. A.</given-names></name>
<etal/>
</person-group>. (<year>2023</year>). 
<article-title>Can seasonal forecasts of ocean conditions aid fisheries managers</article-title>? <source>Oceanography</source> <volume>36</volume>, <fpage>158</fpage>&#x2013;<lpage>167</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.5670/oceanog.2023.219</pub-id>
</mixed-citation>
</ref>
<ref id="B96">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Smith</surname> <given-names>N.</given-names></name>
</person-group> (<year>2000</year>). 
<article-title>The global ocean data assimilation experiment</article-title>. <source>Adv. Space. Res.</source> <volume>25</volume>, <fpage>1089</fpage>&#x2013;<lpage>1098</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/S0273-1177(99)00868-6</pub-id>
</mixed-citation>
</ref>
<ref id="B97">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Spillman</surname> <given-names>C. M.</given-names></name>
<name><surname>Hobday</surname> <given-names>A. J.</given-names></name>
<name><surname>Behrens</surname> <given-names>E.</given-names></name>
<name><surname>Feng</surname> <given-names>M.</given-names></name>
<name><surname>Capotondi</surname> <given-names>A.</given-names></name>
<name><surname>Cravatte</surname> <given-names>S.</given-names></name>
<etal/>
</person-group>. (<year>2025</year>). 
<article-title>What makes a marine heatwave forecast useable, useful and used</article-title>? <source>Prog. Oceanogr.</source> <volume>234</volume>, <elocation-id>103464</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.pocean.2025.103464</pub-id>
</mixed-citation>
</ref>
<ref id="B98">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Stewart</surname> <given-names>K.</given-names></name>
<name><surname>Kim</surname> <given-names>W.</given-names></name>
<name><surname>Urakawa</surname> <given-names>S.</given-names></name>
<name><surname>Hogg</surname> <given-names>A. M.</given-names></name>
<name><surname>Yeager</surname> <given-names>S.</given-names></name>
<name><surname>Tsujino</surname> <given-names>H.</given-names></name>
<etal/>
</person-group>. (<year>2020</year>). 
<article-title>JRA55-do-based repeat year forcing datasets for driving ocean&#x2013;sea-ice models</article-title>. <source>Ocean. Model.</source> <volume>147</volume>, <fpage>101557</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.ocemod.2019.101557</pub-id>
</mixed-citation>
</ref>
<ref id="B99">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Temperton</surname> <given-names>C.</given-names></name>
<name><surname>Williamson</surname> <given-names>D. L.</given-names></name>
</person-group> (<year>1981</year>). 
<article-title>Normal mode initialization for a multilevel grid-point model. Part I: Linear aspects</article-title>. <source>Monthly. Weather. Rev.</source> <volume>109</volume>, <fpage>729</fpage>&#x2013;<lpage>743</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1175/1520-0493(1981)109&lt;0729:NMIFAM&gt;2.0.CO;2</pub-id>
</mixed-citation>
</ref>
<ref id="B100">
<mixed-citation publication-type="book">
<person-group person-group-type="author">
<name><surname>Van den Dool</surname> <given-names>H. M.</given-names></name>
</person-group> (<year>2007</year>). <source>Empirical methods in short-term climate prediction</source> (<publisher-loc>Oxford, England, UK</publisher-loc>: 
<publisher-name>Oxford University Press</publisher-name>).
</mixed-citation>
</ref>
<ref id="B101">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Vidgen</surname> <given-names>B.</given-names></name>
<name><surname>Yasseri</surname> <given-names>T.</given-names></name>
</person-group> (<year>2016</year>). 
<article-title>P-values: misunderstood and misused</article-title>. <source>Front. Phys.</source> <volume>4</volume>, <elocation-id>6</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fphy.2016.00006</pub-id>
</mixed-citation>
</ref>
<ref id="B102">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Walsh</surname> <given-names>J. E.</given-names></name>
<name><surname>Brettschneider</surname> <given-names>B.</given-names></name>
<name><surname>Kettle</surname> <given-names>N. P.</given-names></name>
<name><surname>Thoman</surname> <given-names>R. L.</given-names></name>
</person-group> (<year>2021</year>). 
<article-title>An analog method for seasonal forecasting in northern high latitudes</article-title>. <source>Atmosph. Climate Sci.</source> <volume>11</volume>, <fpage>469</fpage>&#x2013;<lpage>485</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.4236/acs.2021.113028</pub-id>
</mixed-citation>
</ref>
<ref id="B103">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Wang</surname> <given-names>X.</given-names></name>
<name><surname>Li</surname> <given-names>Y.</given-names></name>
</person-group> (<year>2022</year>). 
<article-title>Facial recognition system based on genetic algorithm improved ROI-KNN convolutional neural network</article-title>. <source>Appl. Bionics. Biomech.</source> <volume>2022</volume>, <fpage>7976856</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1155/2022/7976856</pub-id>, PMID: <pub-id pub-id-type="pmid">36263255</pub-id>
</mixed-citation>
</ref>
<ref id="B104">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Waters</surname> <given-names>J.</given-names></name>
<name><surname>Bell</surname> <given-names>M.</given-names></name>
<name><surname>Martin</surname> <given-names>M.</given-names></name>
<name><surname>Lea</surname> <given-names>D.</given-names></name>
</person-group> (<year>2017</year>). 
<article-title>Reducing ocean model imbalances in the equatorial region caused by data assimilation</article-title>. <source>Q. J. R. Meteorol. Soc.</source> <volume>143</volume>, <fpage>195</fpage>&#x2013;<lpage>208</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/qj.2912</pub-id>
</mixed-citation>
</ref>
<ref id="B105">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Xie</surname> <given-names>T.</given-names></name>
<name><surname>Chen</surname> <given-names>L.</given-names></name>
<name><surname>Yi</surname> <given-names>B.</given-names></name>
<name><surname>Li</surname> <given-names>S.</given-names></name>
<name><surname>Leng</surname> <given-names>Z.</given-names></name>
<name><surname>Gan</surname> <given-names>X.</given-names></name>
<etal/>
</person-group>. (<year>2024</year>). 
<article-title>Application of the improved k-nearest neighbor-based multi-model ensemble method for runoff prediction</article-title>. <source>Water</source> <volume>16</volume>, <fpage>69</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/w16010069</pub-id>
</mixed-citation>
</ref>
<ref id="B106">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Xing</surname> <given-names>W.</given-names></name>
<name><surname>Bei</surname> <given-names>Y.</given-names></name>
</person-group> (<year>2019</year>). 
<article-title>Medical health big data classification based on kNN classification algorithm</article-title>. <source>IEEE Access</source> <volume>8</volume>, <fpage>28808</fpage>&#x2013;<lpage>28819</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1109/ACCESS.2019.2955754</pub-id>
</mixed-citation>
</ref>
<ref id="B107">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Xing</surname> <given-names>Q.</given-names></name>
<name><surname>Yu</surname> <given-names>H.</given-names></name>
<name><surname>Wang</surname> <given-names>H.</given-names></name>
<name><surname>Ito</surname> <given-names>S.-i.</given-names></name>
<name><surname>Chai</surname> <given-names>F.</given-names></name>
</person-group> (<year>2023</year>). 
<article-title>Mesoscale eddies modulate the dynamics of human fishing activities in the global midlatitude ocean</article-title>. <source>Fish. Fish.</source> <volume>24</volume>, <fpage>527</fpage>&#x2013;<lpage>543</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/faf.12742</pub-id>
</mixed-citation>
</ref>
<ref id="B108">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Zhang</surname> <given-names>S.</given-names></name>
<name><surname>Li</surname> <given-names>X.</given-names></name>
<name><surname>Zong</surname> <given-names>M.</given-names></name>
<name><surname>Zhu</surname> <given-names>X.</given-names></name>
<name><surname>Cheng</surname> <given-names>D.</given-names></name>
</person-group> (<year>2017</year>). 
<article-title>Learning k for kNN classification</article-title>. <source>ACM Trans. Intell. Syst. Technol. (TIST).</source> <volume>8</volume>, <fpage>1</fpage>&#x2013;<lpage>19</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1145/2990508</pub-id>
</mixed-citation>
</ref>
<ref id="B109">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Zhang</surname> <given-names>X.</given-names></name>
<name><surname>Oke</surname> <given-names>P.</given-names></name>
<name><surname>Feng</surname> <given-names>M.</given-names></name>
<name><surname>Chamberlain</surname> <given-names>M.</given-names></name>
<name><surname>Church</surname> <given-names>J.</given-names></name>
<name><surname>Monselesan</surname> <given-names>D.</given-names></name>
<etal/>
</person-group>. (<year>2016</year>). 
<article-title>A near-global eddy-resolving OGCM for climate studies</article-title>. <source>Geosci. Model. Dev. Discuss.</source> <volume>2016</volume>, <fpage>1</fpage>&#x2013;<lpage>52</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.5194/gmd-2016-17</pub-id>
</mixed-citation>
</ref>
</ref-list>
<fn-group>
<fn id="n1" fn-type="custom" custom-type="edited-by">
<p>Edited by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/342712">Chunyan Li</ext-link>, Louisiana State University, United States</p></fn>
<fn id="n2" fn-type="custom" custom-type="reviewed-by">
<p>Reviewed by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/947564">Mihailov Maria Emanuela</ext-link>, Maritime Hydrographic Directorate, Romania</p>
<p><ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2693223">Aleksei V. Buinyi</ext-link>, Marine Information Technologies LLC, Russia</p></fn>
</fn-group>
</back>
</article>