<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Mar. Sci.</journal-id>
<journal-title>Frontiers in Marine Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Mar. Sci.</abbrev-journal-title>
<issn pub-type="epub">2296-7745</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fmars.2023.1260047</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Marine Science</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Optimization of the k-nearest-neighbors model for summer Arctic Sea ice prediction</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Lin</surname>
<given-names>Yongcheng</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2379013"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Yang</surname>
<given-names>Qinghua</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/602570"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Li</surname>
<given-names>Xuewei</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2247404"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Yang</surname>
<given-names>Chao-Yuan</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1988121"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Wang</surname>
<given-names>Yiguo</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1354088"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Wang</surname>
<given-names>Jiuke</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2542826"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Liu</surname>
<given-names>Jingwen</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2381217"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Chen</surname>
<given-names>Sizhe</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2397356"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Liu</surname>
<given-names>Jiping</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/975765"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>School of Atmospheric Sciences, Sun Yat-sen University, and Southern Marine Science and Engineering Guangdong Laboratory</institution>, <addr-line>Zhuhai</addr-line>, <country>China</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>State Key Laboratory of Coastal and Offshore Engineering, Dalian University of Technology</institution>, <addr-line>Dalian</addr-line>, <country>China</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Nansen Environmental and Remote Sensing Center and Bjerknes Centre for Climate Research</institution>, <addr-line>Bergen</addr-line>, <country>Norway</country>
</aff>
<aff id="aff4">
<sup>4</sup>
<institution>School of Artificial Intelligence, Sun Yat-sen University</institution>, <addr-line>Zhuhai</addr-line>, <country>China</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>Edited by: Wenli Zhong, Ocean University of China, China</p>
</fn>
<fn fn-type="edited-by">
<p>Reviewed by: Qi Shu, Ministry of Natural Resources, China; Peng Lu, Dalian University of Technology, China</p>
</fn>
<fn fn-type="corresp" id="fn001">
<p>*Correspondence: Xuewei Li, <email xlink:href="mailto:lixw39@mail.sysu.edu.cn">lixw39@mail.sysu.edu.cn</email>
</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>23</day>
<month>10</month>
<year>2023</year>
</pub-date>
<pub-date pub-type="collection">
<year>2023</year>
</pub-date>
<volume>10</volume>
<elocation-id>1260047</elocation-id>
<history>
<date date-type="received">
<day>17</day>
<month>07</month>
<year>2023</year>
</date>
<date date-type="accepted">
<day>04</day>
<month>10</month>
<year>2023</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2023 Lin, Yang, Li, Yang, Wang, Wang, Liu, Chen and Liu</copyright-statement>
<copyright-year>2023</copyright-year>
<copyright-holder>Lin, Yang, Li, Yang, Wang, Wang, Liu, Chen and Liu</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>The Arctic sea ice plays a significant role in climate-related processes and has a considerable effect on humans; however, accurately predicting the Arctic sea ice concentration is still challenging. Recently, with the rise and development of artificial intelligence and big data technology, machine learning has been widely used in the field of sea ice prediction. In this study, we utilized a sea ice concentration dataset obtained from satellite remote sensing and applied the k-nearest-neighbors (Ice-kNN) machine learning model to forecast the summer Arctic sea ice concentration and extent over a 122-day prediction period. Based on the physical characteristics of summer sea ice, different algorithms are employed to optimize the prediction model. A drift-ice correction algorithm is designed to address the unrealistic drift ice around the sea ice edge, and a distance function combined with the spatial pattern is proposed to enhance similarity detection. Deseasonalized and detrended sea ice datasets and an expanded training library are also utilized to improve model performance. Furthermore, sensitivity analysis reveals a positive impact of net surface heat flux on sea ice prediction. The modified Ice-kNN model outperforms climatological and anomaly persistence predictions, demonstrating its applicability to predicting summer Arctic sea ice. The September sea ice extent hindcasts of the modified Ice-kNN model are compared to a variety of models submitted to the Sea Ice Prediction Network, underscoring its potential to improve predictive skill for Arctic sea ice.</p>
</abstract>
<kwd-group>
<kwd>sea ice prediction</kwd>
<kwd>summer Arctic</kwd>
<kwd>machine learning</kwd>
<kwd>KNN</kwd>
<kwd>optimization</kwd>
</kwd-group>
<counts>
<fig-count count="9"/>
<table-count count="1"/>
<equation-count count="3"/>
<ref-count count="43"/>
<page-count count="16"/>
<word-count count="7187"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-in-acceptance</meta-name>
<meta-value>Physical Oceanography</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<label>1</label>
<title>Introduction</title>
<p>Sea ice is important for climate processes such as heat, momentum, and material exchange between the ocean and the atmosphere (<xref ref-type="bibr" rid="B16">Lindsay et&#xa0;al., 2008</xref>; <xref ref-type="bibr" rid="B32">Steele et&#xa0;al., 2008</xref>). It also has a variety of ecological and social impacts, for example, the melting of sea ice affects species interaction, population mixing, productivity, and disease transmission (<xref ref-type="bibr" rid="B27">Post et&#xa0;al., 2013</xref>).</p>
<p>In recent years, the marked decline in Arctic sea ice extent (SIE; defined as the area of the ocean where the sea ice concentration is more than 15%) has caused widespread international concern (<xref ref-type="bibr" rid="B34">Stroeve et&#xa0;al., 2012</xref>; <xref ref-type="bibr" rid="B13">Kwok, 2018</xref>; <xref ref-type="bibr" rid="B33">Stroeve &amp; Notz, 2018</xref>). The smallest decline occurred in winter, while the largest occurred in September. The trend for September over the period 1979-2017 was -83,000 km<sup>2</sup>/year, or -13.0% per decade when compared to the average extent for 1981-2010 (<xref ref-type="bibr" rid="B30">Serreze &amp; Meier, 2019</xref>). The loss of sea ice has transformed the once unnavigable Arctic region into a seasonally navigable region (<xref ref-type="bibr" rid="B20">Melia et&#xa0;al., 2016</xref>). Affected by sea ice seasonal fluctuations, forecasting of sea ice in summer is vital to the safety and efficiency of navigation in the Arctic (<xref ref-type="bibr" rid="B36">Vihma, 2014</xref>; <xref ref-type="bibr" rid="B37">Wang et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B4">Chen et&#xa0;al., 2020</xref>; <xref ref-type="bibr" rid="B22">Min et&#xa0;al., 2022</xref>). Accurate sea ice forecasts in the summer months can also aid in mitigating potential hazards posed to navigation, such as navigation delays, collisions, and navigation errors. Furthermore, reliable predictions of SIE enable better planning and resource allocation for Arctic shipping endeavors, helping to ensure that the safest and most economical routes are used.</p>
<p>Since 2008, the Sea Ice Prediction Network (SIPN) has been collecting predictions of Arctic September SIE from contributors around the world (<xref ref-type="bibr" rid="B2">Bhatt et&#xa0;al., 2022a</xref>). SIPN has requested participants to submit their predicted September Arctic SIE during early June, July, August, and September. Through these submissions, SIPN provides an indication of the current prediction status of summer Arctic sea ice on the sub-seasonal-to-seasonal (S2S) timescale. Most contributors utilize dynamic models and statistical models. However, according to the predictive September SIEs submitted to SIPN, accurately predicting the Arctic SIE and spatial distribution of Arctic sea ice concentration (SIC) on the S2S timescale is still challenging, especially in September when SIE is at its minimum for the year (<xref ref-type="bibr" rid="B39">Wei et&#xa0;al., 2021</xref>).</p>
<p>With the recent advances in machine learning techniques, machine learning has been widely applied to Earth system analyses (<xref ref-type="bibr" rid="B28">Reichstein et&#xa0;al., 2019</xref>), which has resulted in substantial progress in the forecasting of Arctic sea ice. <xref ref-type="bibr" rid="B6">Chi and Kim (2017)</xref> used a fully data-driven deep learning long short-term memory (LSTM) model to predict the monthly Arctic sea ice in 2015. <xref ref-type="bibr" rid="B12">Jun Kim et&#xa0;al. (2020)</xref> used a convolutional neural network (CNN) to predict the monthly Arctic sea ice during 2000&#x2013;2017. <xref ref-type="bibr" rid="B1">Andersson et&#xa0;al. (2021)</xref> established the monthly distribution probability model IceNet of Arctic sea ice based on a U-Net structure, and compared it with the SEAS5 model. IceNet has better predictive skill than the SEAS5 model and the linear trend model for extreme events. <xref ref-type="bibr" rid="B24">Mu et&#xa0;al. (2023)</xref> constructed the Ice Temporal Fusion Transformer (IceTFT) model with 11 predictors to directly predict the 12-month SIE. Its prediction error for September SIE nine months in advance is less than 0.1 &#xd7; 10<sup>6</sup> km<sup>2</sup>. The above models mainly focus on the monthly sea ice, rather than the daily sea ice. <xref ref-type="bibr" rid="B8">Fritzner et&#xa0;al. (2020)</xref> designed two machine learning models, namely, a fully convolutional network (FCN) and k-nearest-neighbors (kNN) to forecast the Arctic sea ice for one to four weeks. The predictive skill of the FCN model was similar to that of the dynamic model, Metroms. It is worth noting that the kNN model performs the best among all models for the seven-day predictive skill.</p>
<p>In general, since CNNs excel in image and signal processing tasks by capturing spatial relations, many studies have employed convolutional neural networks, either independently or as part of more complex networks, to tackle the challenge of spatial prediction for sea ice. On the other hand, some researchers have utilized traditional time series models to address point-to-point sea ice prediction. The selection of these models hinges upon the specific problem at hand, the available data, and the desired level of performance. It is often advantageous to explore diverse algorithms and techniques to discern the most suitable approach for the given task. kNN is one of the most commonly used machine learning methods (<xref ref-type="bibr" rid="B35">Thanh Noi and Kappas, 2017</xref>; <xref ref-type="bibr" rid="B42">Zhang et&#xa0;al., 2017</xref>; <xref ref-type="bibr" rid="B43">Zhang et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B8">Fritzner et&#xa0;al., 2020</xref>). The kNN model has many advantages compared to other machine learning models. These include its simplicity, low computational cost, and robustness in dealing with noisy training data. It is also a non-parametric model. That means its performance is not affected by changes in the underlying data distribution. Additionally, it is highly effective with datasets that contain multiple classes and can easily deal with new instances of data, making it ideal for real-world applications (<xref ref-type="bibr" rid="B7">Deng et&#xa0;al., 2016</xref>; <xref ref-type="bibr" rid="B35">Thanh Noi and Kappas, 2017</xref>; <xref ref-type="bibr" rid="B43">Zhang et&#xa0;al., 2018</xref>). In <xref ref-type="bibr" rid="B8">Fritzner et&#xa0;al. (2020)</xref>, the kNN model outperformed both the FCN and dynamic models in weather-scale forecasting, yet it demonstrated a lack of spatial connectivity and forecast an unrealistic abundance of drift ice around the sea ice edge in long-term-scale predictions.</p>
<p>In this study, we focus on the sea ice forecast during summer (June&#x2013;September) over a 122-day prediction period, with the aim of optimizing the kNN-based method and exploring the potential of the prediction ability of summer Arctic SIC. Our study advances previous work in two respects. First, the Ice-kNN model removes some of the unrealistic drift ice around the sea ice edge using a drift-ice correction algorithm. Second, we present different processes for the key steps of the Ice-kNN model to enhance the accuracy of the summer daily Arctic SIC predictions. The remaining sections of this paper are organized as follows: Section 2 describes the data used in this study and presents different processes used in the Ice-kNN model. Section 3 evaluates the hindcast skill of the Ice-kNN models and provides a comparison with the September SIEs submitted to the SIPN. Finally, Section 4 provides a summary and discussion of the findings.</p>
</sec>
<sec id="s2">
<label>2</label>
<title>Dataset</title>
<p>In this study, daily Arctic SIC data on a 25 &#xd7; 25&#xa0;km grid from 1979 to 2020 were obtained from the National Snow and Ice Data Centre (NSIDC; <ext-link ext-link-type="uri" xlink:href="http://nsidc.org">http://nsidc.org</ext-link>) (<xref ref-type="bibr" rid="B19">Maslanik and Stroeve, 1999</xref>). Multiple spaceborne remote sensing instruments (e.g., the Nimbus 7 Scanning Multichannel Microwave Radiometer (SMMR) and the Special Sensor Microwave Imager (SSM/I and SSMIS) on board the Defense Meteorological Satellite Program (DMSP) satellites) have been used to generate this dataset. The SIC data are accessed starting from the 26th of October 1978 on alternate days until the 31st of July 1987 and subsequently on a daily basis. The missing data were obtained by linear interpolation. Atmospheric data from the European Centre for Medium-Range Weather Forecasts (ECMWF) Re-Analysis 5 (ERA5) were used, including 2m temperature (T2m), sea-level pressure (SLP), and surface net heat flux (Sflux, which is calculated by summing up surface latent heat flux, surface sensible heat flux, surface net long-wave radiation flux and surface net short-wave radiation flux) from 1982 to 2020 with a 0.25&#xb0; &#xd7; 0.25&#xb0; horizontal resolution (<xref ref-type="bibr" rid="B10">Hersbach et&#xa0;al., 2020</xref>). In addition, daily reanalysis sea surface temperature (SST) data from the NOAA Optimum Interpolation SST, version 2.1, dataset (OISST) for the period of 1982-2020 with a horizontal resolution of 0.25&#xb0; &#xd7; 0.25&#xb0; were used (<xref ref-type="bibr" rid="B11">Huang et&#xa0;al., 2021</xref>). Due to the SST warm bias over the ice-covered regions, only SST data where SIC is less than 15% were used. Both atmospheric and oceanic data fields were standardized to ensure that the dimensions of the SIC and the atmospheric and oceanic data fields are consistent. 
The reanalysis datasets were re-gridded to the polar stereographic 25&#xa0;km EASE-Grid by linear interpolation.</p>
</sec>
<sec id="s3">
<label>3</label>
<title>Methods</title>
<sec id="s3_1">
<label>3.1</label>
<title>Traditional kNN model</title>
<p>For a given target unlabeled sample <inline-formula>
<mml:math display="inline" id="im1">
<mml:mrow>
<mml:msub>
<mml:mtext>x</mml:mtext>
<mml:mtext>t</mml:mtext>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, we find the most similar state called the nearest labeled samples <inline-formula>
<mml:math display="inline" id="im2">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext>&#xa0;x</mml:mtext>
</mml:mrow>
<mml:msup>
<mml:mtext>t</mml:mtext>
<mml:mo>&#x2032;</mml:mo>
</mml:msup>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, from a library based on distance function. Then, the subsequent evolution <inline-formula>
<mml:math display="inline" id="im3">
<mml:mrow>
<mml:msub>
<mml:mtext>x</mml:mtext>
<mml:mrow>
<mml:msup>
<mml:mtext>t</mml:mtext>
<mml:mo>&#x2032;</mml:mo>
</mml:msup>
<mml:mo>+</mml:mo>
<mml:mi>&#x3c4;</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> of the <inline-formula>
<mml:math display="inline" id="im4">
<mml:mrow>
<mml:msub>
<mml:mtext>x</mml:mtext>
<mml:msup>
<mml:mtext>t</mml:mtext>
<mml:mo>&#x2032;</mml:mo>
</mml:msup>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> are weight averaged based on combination functions to calculate <inline-formula>
<mml:math display="inline" id="im5">
<mml:mrow>
<mml:msub>
<mml:mtext>x</mml:mtext>
<mml:mrow>
<mml:mtext>t&#xa0;+&#x3c4;</mml:mtext>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>. To construct the forecast, the nearest labeled samples are weighted as follows:</p>
<disp-formula>
<label>(1)</label>
<mml:math display="block" id="M1">
<mml:mrow>
<mml:msub>
<mml:mtext>x</mml:mtext>
<mml:mrow>
<mml:mtext>t&#xa0;+&#x3c4;</mml:mtext>
</mml:mrow>
</mml:msub>
<mml:mtext>&#xa0;=</mml:mtext>
<mml:mstyle displaystyle="true">
<mml:munderover>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mtext>i</mml:mtext>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mtext>k</mml:mtext>
</mml:munderover>
</mml:mstyle>
<mml:msub>
<mml:mtext>w</mml:mtext>
<mml:mtext>i</mml:mtext>
</mml:msub>
<mml:msubsup>
<mml:mrow>
<mml:mo>&#xd7;</mml:mo>
<mml:mtext>x</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:msup>
<mml:mtext>t</mml:mtext>
<mml:mo>&#x2032;</mml:mo>
</mml:msup>
<mml:mo>+</mml:mo>
<mml:mi>&#x3c4;</mml:mi>
</mml:mrow>
<mml:mtext>i</mml:mtext>
</mml:msubsup>
<mml:mtext>&#xa0;</mml:mtext>
</mml:mrow>
</mml:math>
</disp-formula>
<p>where <inline-formula>
<mml:math display="inline" id="im6">
<mml:mrow>
<mml:msub>
<mml:mtext>x</mml:mtext>
<mml:mrow>
<mml:mtext>t&#xa0;+&#x3c4;</mml:mtext>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is the predicted variable with lead time <italic>&#x3c4;</italic>, <inline-formula>
<mml:math display="inline" id="im7">
<mml:mrow>
<mml:msub>
<mml:mtext>w</mml:mtext>
<mml:mtext>i</mml:mtext>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is the weight corresponding to the <italic>i</italic>
<sup>th</sup> selected nearest labeled sample; <italic>k</italic> is the number of the nearest labeled samples, <inline-formula>
<mml:math display="inline" id="im8">
<mml:msup>
<mml:mtext>t</mml:mtext>
<mml:mo>&#x2032;</mml:mo>
</mml:msup>
</mml:math>
</inline-formula> is the historical period of t. The w<sub>i</sub> values are kept constant in the forecast and do not change with the lead time <italic>&#x3c4;</italic>.</p>
</sec>
<sec id="s3_2">
<label>3.2</label>
<title>Experiments design</title>
<p>A control run named Ice-kNN-Ctrl was constructed according to the traditional kNN model. The traditional kNN model has three main procedures that can influence the predictive skill, namely, the distance function, which measures the similarity between samples, the selection of the k value, and the combination function based on the closest labeled samples (<xref ref-type="bibr" rid="B42">Zhang et&#xa0;al., 2017</xref>). Our research focuses on how to organically adapt the physical properties of sea ice to the kNN model, instead of adjusting the parameters. Therefore, Ice-kNN-Ctrl used Euclidean distance to measure the similarity, which is one of the most commonly used distance functions (<xref ref-type="bibr" rid="B42">Zhang et&#xa0;al., 2017</xref>); the combination function was set as distance weighting, which assigns weights inverse to the distance and prioritizes the examination of local structures surrounding the samples to be predicted; only SIC was used as input data to calculate the Euclidean distance. A group of hindcast experiments with different k values were conducted and it is found that the prediction results were insensitive to k values (<xref ref-type="supplementary-material" rid="SM1">
<bold>Figure S1</bold>
</xref>). Therefore, the k value for Ice-kNN-Ctrl is only 3.</p>
<p>In this study, following <xref ref-type="bibr" rid="B40">Yang et&#xa0;al. (2020)</xref>, the summer Arctic sea ice prediction is typically initialized on 1st June. The SIC forecasts are conducted for the independent period from June to September, 2011&#x2013;2020, which does not overlap with the training period from June to September, 1979 to 2010.</p>
<p>Built on Ice-kNN-Ctrl, we selected different processes for the key steps of the prediction model to optimize its results in <xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>. These algorithms were identified in advance by our sensitivity experiments to have a considerable impact on the SIC predictive skill. The key steps of the prediction model are: data preprocessing of deseasonalization and detrending; a drift-ice correction algorithm; expansion of the training library; a distance function; and predictors. <xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1</bold>
</xref> illustrates the processes of forecasting the SIC using Ice-kNN.</p>
<table-wrap id="T1" position="float">
<label>Table&#xa0;1</label>
<caption>
<p>Experiment design using the kNN model for the optimization.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="center">Model</th>
<th valign="middle" align="center">Preprocessing</th>
<th valign="middle" align="center">Drift ice correction</th>
<th valign="middle" align="center">Expand the training library</th>
<th valign="middle" align="center">Distance function</th>
<th valign="middle" align="center">Predictors</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="left">Ice-kNN-Ctrl</td>
<td valign="middle" align="center">
<bold>No</bold>
</td>
<td valign="middle" rowspan="2" align="center">No</td>
<td valign="middle" rowspan="2" align="center">No</td>
<td valign="middle" rowspan="2" align="center">Euclidean distance</td>
<td valign="middle" rowspan="2" align="center">SIC</td>
</tr>
<tr>
<td valign="middle" align="left">Ice-kNN-An</td>
<td valign="middle" align="center">
<bold>Yes</bold>
</td>
</tr>
<tr>
<td valign="middle" align="left">Ice-kNN-F</td>
<td valign="middle" rowspan="2" align="center">Yes</td>
<td valign="middle" align="center">
<bold>Full-field</bold>
</td>
<td valign="middle" rowspan="2" align="center">No</td>
<td valign="middle" rowspan="2" align="center">Euclidean distance</td>
<td valign="middle" rowspan="2" align="center">SIC</td>
</tr>
<tr>
<td valign="middle" align="left">Ice-kNN-FP</td>
<td valign="middle" align="center">
<bold>Full-field + pointwise</bold>
</td>
</tr>
<tr>
<td valign="middle" align="left">Ice-kNN-PA</td>
<td valign="middle" rowspan="2" align="center">Yes</td>
<td valign="middle" rowspan="2" align="center">Full-field + pointwise</td>
<td valign="middle" align="center">
<bold>past adjacent days</bold>
</td>
<td valign="middle" rowspan="2" align="center">Euclidean distance</td>
<td valign="middle" rowspan="2" align="center">SIC</td>
</tr>
<tr>
<td valign="middle" align="left">Ice-kNN-PFA</td>
<td valign="middle" align="center">
<bold>past and future adjacent days</bold>
</td>
</tr>
<tr>
<td valign="middle" align="left">Ice-kNN-PC</td>
<td valign="middle" align="center">Yes</td>
<td valign="middle" align="center">Full-field + pointwise</td>
<td valign="middle" align="center">past adjacent days</td>
<td valign="middle" align="center">
<bold>spatial anomaly correlation coefficient + Euclidean distance</bold>
</td>
<td valign="middle" align="center">SIC</td>
</tr>
<tr>
<td valign="middle" align="left">Ice-kNN-SLP</td>
<td valign="middle" rowspan="4" align="center">Yes</td>
<td valign="middle" rowspan="4" align="center">Full-field + pointwise</td>
<td valign="middle" rowspan="4" align="center">past adjacent days</td>
<td valign="middle" rowspan="4" align="center">spatial anomaly correlation coefficient + Euclidean distance</td>
<td valign="middle" align="center">
<bold>SIC + SLP</bold>
</td>
</tr>
<tr>
<td valign="middle" align="left">Ice-kNN-SST</td>
<td valign="middle" align="center">
<bold>SIC + SST</bold>
</td>
</tr>
<tr>
<td valign="middle" align="left">Ice-kNN-T2m</td>
<td valign="middle" align="center">
<bold>SIC + T2m</bold>
</td>
</tr>
<tr>
<td valign="middle" align="left">Ice-kNN-Sflux</td>
<td valign="middle" align="center">
<bold>SIC + Sflux</bold>
</td>
</tr>
</tbody>
</table>
</table-wrap>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>A flowchart showing the processing steps required for using Ice-kNN to predict Arctic sea ice.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-10-1260047-g001.tif"/>
</fig>
<p>All experiments were conducted on the Intel Xeon E5-2609 (1.70GHz, 16 cores). The kNN model does not separate the time of training and prediction, so it needs to go through the training and prediction process all over again with each prediction. One 122-day prediction at an initial time costs about 300 seconds.</p>
<sec id="s3_2_1">
<label>3.2.1</label>
<title>Deseasonalization and detrending</title>
<p>Time series forecasting models must address the classical patterns frequently encountered in time series data: trend and seasonality. In contrast to the statistical methodologies, wherein established strategies are used to tackle seasonality, there is no universal agreement among computational intelligence methods for dealing with seasonal patterns. <xref ref-type="bibr" rid="B38">Wang et&#xa0;al. (2016)</xref> suggested that the application of detrending may lead to artificial mutation, causing the predicted value of the SIC to exceed the boundary value. Nevertheless, many studies have shown that using anomaly data can achieve better forecast skill (<xref ref-type="bibr" rid="B41">Yuan et&#xa0;al., 2016</xref>; <xref ref-type="bibr" rid="B12">Jun Kim et&#xa0;al., 2020</xref>; <xref ref-type="bibr" rid="B5">Chi et&#xa0;al., 2021</xref>). To determine whether Ice-kNN can benefit from detrending and deseasonalization steps, the Ice-kNN-An experiment was designed, in which the long-term linear trend and the climatological annual cycle of SIC had been subtracted at each grid point.</p>
</sec>
<sec id="s3_2_2">
<label>3.2.2</label>
<title>Drift-ice correction</title>
<p>
<xref ref-type="bibr" rid="B8">Fritzner et&#xa0;al. (2020)</xref> indicated that in the kNN model, the modelling of each point is independent of the others, leading to frequent occurrence of drift ice in the Arctic marginal region in the forecast results. <xref ref-type="bibr" rid="B14">Li et&#xa0;al. (2020)</xref> proposed a method that considers full-field distance of variables and thus the best similarity type can be found. This method considers the spatial correlation of variables to a certain extent and thus alleviates the drift-ice problem in pointwise prediction. Therefore, this study proposed two drift-ice correction algorithms: Full_Field (Ice-kNN-F) and Full_Field_Plus_Pointwise (Ice-kNN-FP). In Ice-kNN-F, the sample was defined as the whole pattern of the sea ice concentration anomaly (SICA) rather than a single point of SICA. In other words, the features of the sample are expanded. In Ice-kNN-FP, the kNN model first defined the sample as the whole pattern of the SICA to predict the sea ice edge location where SIC is greater than 0, and then defined the sample as the grid point of the SICA to predict the SIC within the sea ice edge.</p>
</sec>
<sec id="s3_2_3">
<label>3.2.3</label>
<title>Expand the training library</title>
<p>Owing to the limited length of the SIC satellite record, the training library for each target state has only 32-41 training samples from 2011 to 2020. As in previous studies (<xref ref-type="bibr" rid="B25">Mullan and Thompson, 2006</xref>; <xref ref-type="bibr" rid="B14">Li et&#xa0;al., 2020</xref>), the past adjacent calendar days are selected in the training library. In this way, the library for each target state was expanded threefold in Ice-kNN_Past_Adjacent_Days (Ice-kNN-PA). In addition, to further verify the sensitivity of predictive skill to the number of samples in training library, the past and future adjacent calendar days (which do not overlap with the forecast period) were selected in the training library in Ice-kNN_Past_Future_Adjacent_Days (Ice-kNN-PFA). A series of preliminary experiments were conducted with varying numbers of adjacent days. These experiments revealed that employing one adjacent day to expand the training library can yield desirable levels of both precision and efficiency (<xref ref-type="supplementary-material" rid="SM1">
<bold>Figure S2</bold>
</xref>). Moderately increasing the training database can effectively make up for the lack of training data, but newly added data may contain noise or irrelevant information. If this data introduces incorrect patterns or inconsistencies, it can lead to larger errors. In addition, time-series data often exhibits strong temporal correlation. In kNN, data points from adjacent dates tend to have more similar features because they may be influenced by similar external factors or trends. However, when more adjacent calendar days are added, the model may not effectively capture this temporal correlation, leading to increased errors.</p>
</sec>
<sec id="s3_2_4">
<label>3.2.4</label>
<title>Distance function</title>
<p>Taking into consideration the spatial continuity of the gridded sea ice data, in Ice-kNN_Pattern_Correlation (Ice-kNN-PC), for a given unlabeled sample x<sub>t</sub>, the Euclidean distance and spatial anomaly correlation coefficient were both computed to measure the similarity between samples. The library was then sorted in descending order based on the spatial correlation between fields. The sample with the highest pattern correlation greater than threshold R was selected as the nearest labeled sample, provided that its distance was smaller than the corresponding 25th percentile of the entire library. If the labeled sample did not satisfy these conditions, the next labeled sample in the list was evaluated. This process was repeated until three nearest labeled samples were identified, if available. If there was no training sample that satisfied these conditions, the training sample with the largest pattern correlation was chosen as the nearest labeled sample. Therefore, it was guaranteed that at least one labeled sample was found. We conducted a preliminary experiment to discuss the impact of different threshold values R on prediction skills. The results show that the prediction skills are best, especially for the lead time less than one month when the threshold R is selected as 0.2 (<xref ref-type="supplementary-material" rid="SM1">
<bold>Figure S3</bold>
</xref>). Therefore, the threshold R of Ice-kNN-PC is set to 0.2.</p>
</sec>
<sec id="s3_2_5">
<label>3.2.5</label>
<title>Predictors</title>
<p>Four ice-related variables that have been frequently used in prior studies (<xref ref-type="bibr" rid="B41">Yuan et&#xa0;al., 2016</xref>; <xref ref-type="bibr" rid="B17">Liu et&#xa0;al., 2021</xref>), namely SLP, SST, T2m, and Sflux, along with SIC, were chosen to construct the Ice-kNN model. These four experiments are named Ice-kNN-SLP, Ice-kNN-SST, Ice-kNN-T2m, and Ice-kNN-Sflux, respectively.</p>
</sec>
</sec>
<sec id="s3_3">
<label>3.3</label>
<title>Verification metrics</title>
<p>To assess the forecast skill of the experiments, the SIC predictions of the Ice-kNN model were evaluated at each grid cell using the RMSE of SIC (RMSE_SIC) and bias between the prediction and the observations at 1&#x2013;122 lead days. The bias is the difference between the prediction and observations for the 10-year average from 2011 to 2020. The Arctic is divided into five regions, as shown in <xref ref-type="supplementary-material" rid="SM1">
<bold>Figure S4</bold>
</xref>. Owing to the rapid melting of sea ice in recent years, the grid points where SIC has not changed from 2011 to 2020 were excluded when calculating the regional mean predictive skill (<xref ref-type="bibr" rid="B6">Chi and Kim, 2017</xref>; <xref ref-type="bibr" rid="B12">Jun Kim et&#xa0;al., 2020</xref>).</p>
<p>For SIE verification, three metrics are used: (1) the error of the September monthly mean SIE (&#x394;<sup>SIE</sup>), (2) the RMSE of SIE (RMSE_SIE), and (3) the integrated ice edge error (IIEE) bias &#x394;<sup>IIEE</sup> (<xref ref-type="bibr" rid="B21">Melsom et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B8">Fritzner et&#xa0;al., 2020</xref>). The total extent (sum of cell areas where SIC &gt; 15%) for each day in September was computed and then averaged for the month for each year into a September mean SIE. The IIEE bias metric, &#x394;<sup>IIEE</sup>, is a measure of the relative difference in sea ice offset predicted by the model. It is computed from three parts, the overestimated and underestimated local SIE and the length of the ice edge. The overestimated part consists of sea ice-free areas that are predicted to be covered with sea ice, and the underestimated part consists of sea ice-covered areas that are predicted to be sea ice free. The length of the ice edge is determined by the ice edge of the observed and predicted fields. A positive &#x394;<sup>IIEE</sup> bias means that the overestimated SIE in the model is large relative to the underestimated SIE, and vice versa.</p>
<p>Sensitivity tests were conducted with the Ice-kNN model using SIC along with one extra variable as a predictor variable (<xref ref-type="bibr" rid="B12">Jun Kim et&#xa0;al., 2020</xref>; <xref ref-type="bibr" rid="B17">Liu et&#xa0;al., 2021</xref>). To examine the contribution of each predictor to the predictive skill of SIC, the sensitivity is defined as <italic>Sens</italic>_<italic>SIC</italic>; to examine the contribution to the predictive skill of SIE, the sensitivity is defined as <italic>Sens</italic>_<italic>SIE</italic>. The sensitivity formulas are as follows:</p>
<disp-formula>
<label>(2)</label>
<mml:math display="block" id="M2">
<mml:mrow>
<mml:mi>S</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi>s</mml:mi>
<mml:mo>_</mml:mo>
<mml:mi>S</mml:mi>
<mml:mi>I</mml:mi>
<mml:mi>C</mml:mi>
<mml:mfenced>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>d</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>c</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>r</mml:mi>
</mml:mrow>
</mml:mfenced>
<mml:mo>&#xa0;</mml:mo>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>R</mml:mi>
<mml:mi>M</mml:mi>
<mml:mi>S</mml:mi>
<mml:mi>E</mml:mi>
<mml:mo>_</mml:mo>
<mml:mi>S</mml:mi>
<mml:mi>I</mml:mi>
<mml:msub>
<mml:mi>C</mml:mi>
<mml:mrow>
<mml:mi>s</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>R</mml:mi>
<mml:mi>M</mml:mi>
<mml:mi>S</mml:mi>
<mml:mi>E</mml:mi>
<mml:mo>_</mml:mo>
<mml:mi>S</mml:mi>
<mml:mi>I</mml:mi>
<mml:msub>
<mml:mi>C</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>d</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>c</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>r</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mrow>
<mml:mi>R</mml:mi>
<mml:mi>M</mml:mi>
<mml:mi>S</mml:mi>
<mml:mi>E</mml:mi>
<mml:mo>_</mml:mo>
<mml:mi>S</mml:mi>
<mml:mi>I</mml:mi>
<mml:msub>
<mml:mi>C</mml:mi>
<mml:mrow>
<mml:mi>s</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfrac>
<mml:mo>&#xa0;</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula>
<label>(3)</label>
<mml:math display="block" id="M3">
<mml:mrow>
<mml:mi>S</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi>s</mml:mi>
<mml:mo>_</mml:mo>
<mml:mi>S</mml:mi>
<mml:mi>I</mml:mi>
<mml:mi>E</mml:mi>
<mml:mfenced>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>d</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>c</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>r</mml:mi>
</mml:mrow>
</mml:mfenced>
<mml:mo>&#xa0;</mml:mo>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>R</mml:mi>
<mml:mi>M</mml:mi>
<mml:mi>S</mml:mi>
<mml:mi>E</mml:mi>
<mml:mo>_</mml:mo>
<mml:mi>S</mml:mi>
<mml:mi>I</mml:mi>
<mml:msub>
<mml:mi>E</mml:mi>
<mml:mrow>
<mml:mi>s</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>R</mml:mi>
<mml:mi>M</mml:mi>
<mml:mi>S</mml:mi>
<mml:mi>E</mml:mi>
<mml:mo>_</mml:mo>
<mml:mi>S</mml:mi>
<mml:mi>I</mml:mi>
<mml:msub>
<mml:mi>E</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>d</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>c</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>r</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mrow>
<mml:mi>R</mml:mi>
<mml:mi>M</mml:mi>
<mml:mi>S</mml:mi>
<mml:mi>E</mml:mi>
<mml:mo>_</mml:mo>
<mml:mi>S</mml:mi>
<mml:mi>I</mml:mi>
<mml:msub>
<mml:mi>E</mml:mi>
<mml:mrow>
<mml:mi>s</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfrac>
<mml:mo>&#xa0;</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>
<p>Here <italic>RMSE_SIC<sub>sic</sub>
</italic> (<italic>RMSE_SIE<sub>sic</sub>
</italic>) is the RMSE_SIC (RMSE_SIE) of forecast using only SIC, and the <italic>RMSE_SIC<sub>predictor</sub>
</italic> (<italic>RMSE_SIE<sub>predictor</sub>
</italic>) is the RMSE_SIC (RMSE_SIE) of forecast using SIC and one extra predictor.</p>
</sec>
</sec>
<sec id="s4" sec-type="results">
<label>4</label>
<title>Results</title>
<sec id="s4_1">
<label>4.1</label>
<title>Impacts of deseasonalization and detrending</title>
<p>To examine whether the data preprocessing strategy for removing the seasonality and trend could improve the forecast accuracy of the Ice-kNN model, the predictive skill of Ice-kNN-An is compared with that of Ice-kNN-Ctrl in this section. <xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2</bold>
</xref> shows the comparison of the hindcast skill between Ice-kNN-An and Ice-kNN-Ctrl measured by the different verification metrics. The RMSE_SIC of Ice-kNN-Ctrl increases with the lead time and stays around 16% after one month (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2A</bold>
</xref>). The RMSE_SIC and bias of Ice-kNN-Ctrl in September is mainly distributed in the regions where seasonal sea ice retreats from June to September, including the Beaufort Sea, Chukchi Sea, East Siberian Sea, and Laptev Sea, and it is higher than the climatological prediction in all studied areas (<xref ref-type="fig" rid="f3">
<bold>Figures&#xa0;3</bold>
</xref>, <xref ref-type="fig" rid="f4">
<bold>4A</bold>
</xref>). For SIE, the RMSE_SIE of Ice-kNN-Ctrl increases with lead time and reaches 2.2 &#xd7; 10<sup>6</sup> km<sup>2</sup> in September (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2B</bold>
</xref>). Compared with the observations, the prediction of Ice-kNN-Ctrl always overestimates SIE from June to September, and the overestimation gradually increases with the retreat of seasonal sea ice (<xref ref-type="fig" rid="f2">
<bold>Figures&#xa0;2C</bold>
</xref>, <xref ref-type="supplementary-material" rid="SM1">
<bold>S5A</bold>
</xref>). It may be related to the difficulty of marginal sea ice prediction and the prediction bias of the Ice-kNN model with the increasing prediction time (<xref ref-type="bibr" rid="B9">Guemas et&#xa0;al., 2016</xref>; <xref ref-type="bibr" rid="B17">Liu et&#xa0;al., 2021</xref>).</p>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>Hindcast skill comparison between Ice-kNN-Ctrl (black) and Ice-kNN-An (blue) measured by <bold>(A)</bold> spatial averaged RMSE_SIC, <bold>(B)</bold> RMSE_SIE, <bold>(C)</bold> <inline-formula>
<mml:math display="inline" id="im9">
<mml:mrow>
<mml:msup>
<mml:mi>&#x394;</mml:mi>
<mml:mrow>
<mml:mtext>IIEE</mml:mtext>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>, and <bold>(D)</bold> <inline-formula>
<mml:math display="inline" id="im10">
<mml:mrow>
<mml:msup>
<mml:mi>&#x394;</mml:mi>
<mml:mrow>
<mml:mtext>SIE</mml:mtext>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-10-1260047-g002.tif"/>
</fig>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>Spatial averaged RMSE_SIC of the Ice-kNN model in hindcasting September SIC averaged from 2011 to 2020 in the <bold>(A)</bold> Beaufort Sea, <bold>(B)</bold> Chukchi Sea, <bold>(C)</bold> East Siberian&#x2013;Laptev seas, <bold>(D)</bold> Kara&#x2013;Barents-Greenland seas, and <bold>(E)</bold> Baffin Bay&#x2013;Canadian Archipelago.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-10-1260047-g003.tif"/>
</fig>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>The prediction bias between the Ice-kNN model and the observation of <bold>(A)</bold> Ice-kNN-Ctrl-Bias, <bold>(B)</bold> Ice-kNN-An-Bias, <bold>(C)</bold> Ice-kNN-F-Bias, <bold>(D)</bold> Ice-kNN-FP-Bias, <bold>(E)</bold> Ice-kNN-PA-Bias, <bold>(F)</bold> Ice-kNN-PFA-Bias, <bold>(G)</bold> Ice-kNN-PC-Bias, <bold>(H)</bold> Ice-kNN-SLP-Bias, <bold>(I)</bold> Ice-kNN-SST-Bias, <bold>(J)</bold> Ice-kNN-T2m-Bias, and <bold>(K)</bold> Ice-kNN-Sflux-Bias in September averaged from 2011 to 2020. The black line represents the outline of the 10-year (2011-2020) mean extent for September.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-10-1260047-g004.tif"/>
</fig>
<p>For Ice-kNN-An, there is notable skill enhancement in predicting SIC at lead times longer than one month, and the enhancement of Ice-kNN-An is more pronounced with lead time (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2A</bold>
</xref>). According to the spatial pattern, the September RMSE_SIC and bias of Ice-kNN-An in all areas is lower compared with Ice-kNN-Ctrl (<xref ref-type="fig" rid="f3">
<bold>Figures&#xa0;3</bold>
</xref>, <xref ref-type="fig" rid="f4">
<bold>4A, B</bold>
</xref>). For SIE, although both Ice-kNN-An and Ice-kNN-Ctrl tend to overestimate SIE in summer, the predictive skill of Ice-kNN-An is significantly superior to that of Ice-kNN-Ctrl for summer SIE and the improvement increases with lead time (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2C</bold>
</xref>). This indicates that the Ice-kNN model can better find the temporal evolution of sea ice by extracting the seasonality and trend, especially from an ice-covered period to an ice-free period.</p>
<p>In extreme ice cover years, such as the record low in 2012, the forecast biases are relatively large compared to other years for both models (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2D</bold>
</xref>). On the one hand, the lowest minimum Arctic SIE in 2012 is associated with the large multiyear ice volume export and the storm that entered into the central Arctic in early August 2012 (<xref ref-type="bibr" rid="B26">Parkinson &amp; Comiso, 2013</xref>; <xref ref-type="bibr" rid="B15">Li et&#xa0;al., 2022</xref>). Since the initial day is fixed on June 1st, it is hard for the Ice-kNN model to catch the atmospheric disturbance in the extreme cases. On the other hand, for the extreme cases of SIE, the Ice-kNN model is not suitable to forecast the extreme values which are not included in the training library due to its prediction principle. In the other years, however, Ice-kNN-An shows an impressive improvement compared with Ice-kNN-Ctrl (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2D</bold>
</xref>). However, there is still considerable drift ice outside the sea ice edge in both experiments (<xref ref-type="supplementary-material" rid="SM1">
<bold>Figures S5A, B</bold>
</xref>).</p>
<p>The improvement of Ice-kNN-An indicates that the deseasonalization and detrending step is useful to improve the Arctic sea ice forecast accuracy of the Ice-kNN model. Therefore, the data preprocessing strategy was used to remove the seasonality and the trend components in subsequent experiments.</p>
</sec>
<sec id="s4_2">
<label>4.2</label>
<title>Impact of drift-ice correction</title>
<p>Due to the lack of spatial continuity in the traditional kNN model, both Ice-kNN-Ctrl and Ice-kNN-An forecasts showed unrealistic drift ice around the sea ice edge (<xref ref-type="supplementary-material" rid="SM1">
<bold>Figures S5A, B</bold>
</xref>). This section studies the impact of different drift-ice correction algorithms in the Ice-kNN prediction. As shown in <xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5A</bold>
</xref>, the RMSE_SIC of Ice-kNN-F shows poor predictive skill at lead times of less than 30 days, but it is better than Ice-kNN-An at lead times longer than 30 days. According to the distribution of September RMSE_SIC and bias, Ice-kNN-F is superior to Ice-kNN-An in predicting SIC in September in all sea areas except the Chukchi Sea (<xref ref-type="fig" rid="f3">
<bold>Figures&#xa0;3</bold>
</xref>, <xref ref-type="fig" rid="f4">
<bold>4B, C</bold>
</xref>). The results show that the pointwise modeling is better for the prediction of SICA caused by short-term-scale disturbances, whereas for the SICA caused by large-scale anomalies, selecting the similarity using the full-field distance could improve the predictive skill with lead times of more than one month. Ice-kNN-FP predicted the SIC point by point based on Ice-kNN-F determination of the sea ice edge. It performs better than Ice-kNN-F at lead times of less than 30 days and better than Ice-kNN-An at lead times of longer than 30 days (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5A</bold>
</xref>). In addition, Ice-kNN-FP has a lower unrealistic drift-ice bias compared with Ice-kNN-An, especially in the Chukchi, East Siberian, Laptev, and Kara seas (<xref ref-type="fig" rid="f3">
<bold>Figures&#xa0;3</bold>
</xref>, <xref ref-type="supplementary-material" rid="SM1">
<bold>S5B, D</bold>
</xref>).</p>
<fig id="f5" position="float">
<label>Figure&#xa0;5</label>
<caption>
<p>Hindcast skill comparison between Ice-kNN-An (black), Ice-kNN-F (blue), and Ice-kNN-FP (orange) measured by <bold>(A)</bold> spatial averaged RMSE_SIC, <bold>(B)</bold> RMSE_SIE, <bold>(C)</bold> &#x394;<sup>IIEE</sup>, and <bold>(D)</bold> &#x394;<sup>SIE</sup>.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-10-1260047-g005.tif"/>
</fig>
<p>For SIE, the prediction bias of Ice-kNN-F in the short-term lead time is larger. However, Ice-kNN-FP, which combines full-field distance and single-point distance, shows a significant improvement in sea ice edge compared with Ice-kNN-F and Ice-kNN-An for the whole lead time (<xref ref-type="fig" rid="f5">
<bold>Figures&#xa0;5B, C</bold>
</xref>). In <xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5D</bold>
</xref>, it can be seen that Ice-kNN-FP effectively reduces the bias of the September mean SIE in Ice-kNN-F and Ice-kNN-An in most years.</p>
<p>The kNN model, which takes only a single grid point as the prediction sample, lacks physical spatial connection, and leads to the prediction of unrealistic drift ice. A drift-ice correction algorithm, which selects similarity by full-field distance, would consider the spatial continuity of sea ice but ignore the local SICA caused by short-term disturbance. Therefore, the full-field distance is first used to limit the sea ice coverage, and then pointwise modelling is carried out to predict the SIC of each single grid point, which can effectively correct the unrealistic drift ice of pointwise modelling and the initial sea ice migration bias of full-field modelling. In the following kNN models, the drift-ice correction algorithm of Ice-kNN-FP is applied.</p>
</sec>
<sec id="s4_3">
<label>4.3</label>
<title>Impact of expanding the training library</title>
<p>In principle, the nearest neighbors with insufficient similarity could diverge relatively quickly in time compared with the very close nearest neighbors. The limited Ice-kNN forecast skill may therefore be partly due to the relatively small number of available training labeled samples, which makes the nearest neighbor selection a challenge. As the most accurate summer SIC datasets are limited to the satellite era starting in 1979, the training labeled samples for each state have only 32 to 41 members from 2011 to 2020. To verify the sensitivity of the predictive skill to the number of training labeled samples, Ice-kNN-PA and Ice-kNN-PFA expand the training library by adding adjacent calendar days. The number of training labeled samples in Ice-kNN-PA increases from 96 to 123 from 2011 to 2020, and that in Ice-kNN-PFA increases to 123.</p>
<p>Compared with Ice-kNN-FP, the RMSE_SICs of the Ice-kNN-PA and Ice-kNN-PFA seem not to be significantly reduced (<xref ref-type="fig" rid="f6"><bold>Figure&#xa0;6A</bold></xref>), but from the perspective of different sea areas, the Ice-kNN-PA and Ice-kNN-PFA mainly reduced the positive SIC bias in the sea ice marginal zone of Beaufort Sea and the East Siberian&#x2013;Laptev seas (<xref ref-type="fig" rid="f4"><bold>Figures&#xa0;4D&#x2013;F</bold></xref>, <xref ref-type="supplementary-material" rid="SM1"><bold>S6A, B</bold></xref>). For SIE, Ice-kNN-PA and Ice-kNN-PFA have a larger initial bias at lead times of less than two weeks (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6B</bold>
</xref>), which is mainly due to the underestimation of SIE (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6C</bold>
</xref>). However, Ice-kNN-PA and Ice-kNN-PFA show significant improvement in predicting SIE after that (<xref ref-type="fig" rid="f6">
<bold>Figures&#xa0;6B, C</bold>
</xref>). In <xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6D</bold>
</xref>, except for 2017 in Ice-kNN-PFA, the September mean SIE bias of Ice-kNN-PA and Ice-kNN-PFA is reduced by about 0.5 million square kilometers compared with Ice-kNN-FP.</p>
<fig id="f6" position="float">
<label>Figure&#xa0;6</label>
<caption>
<p>Hindcast skill comparison between Ice-kNN-FP (black), Ice-kNN-PA (blue), and Ice-kNN-PFA (orange) measured by <bold>(A)</bold> spatial averaged RMSE_SIC, <bold>(B)</bold> RMSE_SIE, <bold>(C)</bold> &#x394;<sup>IIEE</sup>, and <bold>(D)</bold> &#x394;<sup>SIE</sup>.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-10-1260047-g006.tif"/>
</fig>
<p>In general, expanding the training library will cause an initial underestimation bias, but it will not rapidly diverge with increasing lead time. The predictive skill of the experiments that use the expanded training library is significantly improved compared with Ice-kNN-FP with lead times of more than two weeks. Using the future adjacent calendar days as the training labeled samples has relatively little impact, except for 2017 when Ice-kNN-PFA selects a future sample as the nearest sample. The younger and thinner Arctic sea ice in recent years is more sensitive to external forcing (<xref ref-type="bibr" rid="B26">Parkinson &amp; Comiso, 2013</xref>), resulting in a large deviation in the forecast results when the future adjacent calendar days are selected in the training library.</p>
<p>Therefore, selecting sufficient training labeled samples could better improve the predictive skill of the Ice-kNN model for Arctic sea ice. In subsequent experiments, the strategy of expanding the training library by adding past adjacent calendar days as training labeled samples to predict the Arctic sea ice was applied.</p>
</sec>
<sec id="s4_4">
<label>4.4</label>
<title>Impact of distance function</title>
<p>In previous Ice-kNN models, the Euclidean distance has been selected most frequently as the distance function. In the prediction of sea ice, not only the distance between grid cells but also the spatial correlation coefficient between states should be considered to select similarity. In this section, a compound distance function scheme, including the spatial anomaly correlation coefficient and the Euclidean distance between sea ice, is studied.</p>
<p>As shown in <xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7A</bold>
</xref>, the RMSE_SIC of Ice-kNN-PC is comparable to that of Ice-kNN-PA. According to the spatial pattern, the September RMSE_SIC and bias of Ice-kNN-PC decreases in the East Siberian&#x2013;Laptev seas and Kara&#x2013;Barents&#x2013;Greenland seas, but increases in the Beaufort Sea, Chukchi Sea, and Baffin Bay&#x2013;Canadian Archipelago compared with Ice-kNN-PA (<xref ref-type="fig" rid="f3">
<bold>Figures&#xa0;3</bold>
</xref>, <xref ref-type="fig" rid="f4">
<bold>4F, G</bold>
</xref>). For the SIE, the RMSE_SIE of Ice-kNN-PC has a larger bias at lead times of less than one week (<xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7B</bold>
</xref>), which is mainly due to the underestimation of SIE (<xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7C</bold>
</xref>). However, Ice-kNN-PC shows improvement in SIE compared with Ice-kNN-PA at lead times of more than one week and the improvement is more pronounced with increasing lead time (<xref ref-type="fig" rid="f7">
<bold>Figures&#xa0;7B, C</bold>
</xref>). In <xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7D</bold>
</xref>, except for 2012, the biases of monthly mean SIE in September of Ice-kNN-PC from 2011 to 2020 are within about 0.5 million square kilometers, which is lower than Ice-kNN-PA.</p>
<fig id="f7" position="float">
<label>Figure&#xa0;7</label>
<caption>
<p>Hindcast skill comparison between Ice-kNN-PA (black) and Ice-kNN-PC (blue) measured by <bold>(A)</bold> spatial averaged RMSE_SIC, <bold>(B)</bold> RMSE_SIE, <bold>(C)</bold> &#x394;<sup>IIEE</sup>, and <bold>(D)</bold> &#x394;<sup>SIE</sup>.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-10-1260047-g007.tif"/>
</fig>
<p>In general, the composite distance function with a spatial anomaly correlation coefficient is beneficial to the prediction of Arctic sea ice. The new distance function considers not only the similarity between samples at a single point through the Euclidean distance but also the spatial mode of the SICA through the spatial anomaly correlation coefficient. It is helpful for the Ice-kNN model to consider the large-scale spatial variation of SICA when selecting the similarity. Therefore, in the following experiments, a composite distance function combining the Euclidean distance and the spatial anomaly correlation coefficient is used to further improve the predictive skill of the Ice-kNN model.</p>
</sec>
<sec id="s4_5">
<label>4.5</label>
<title>Impact of sea ice-related predictors</title>
<p>To verify the impact of sea ice-related atmospheric and oceanic variables on the predictive skill of summer Arctic sea ice, SIC and SIE sensitivity indices including sea ice-related variables were calculated based on the Ice-kNN-PC model in <xref ref-type="fig" rid="f8">
<bold>Figure&#xa0;8</bold>
</xref>. A positive sensitivity index indicates that a variable has a positive contribution to the predictive skill of SIC (SIE).</p>
<fig id="f8" position="float">
<label>Figure&#xa0;8</label>
<caption>
<p>The monthly mean sensitivity indexes from June to September of <bold>(A)</bold> RMSE_SIC-based for SIC and <bold>(B)</bold> RMSE_SIE-based for SIE with kNN using different predictors (blue, SIC/SLP; orange, SIC/SST; grey, SIC/T2m; yellow, SIC/Sflux).</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-10-1260047-g008.tif"/>
</fig>
<p>Ice-kNN-Sflux, which selects Sflux and SIC as predictors, improves the predictive skill of SIC for the whole lead time (<xref ref-type="fig" rid="f8">
<bold>Figure&#xa0;8A</bold>
</xref>). SST improves the predictive skill at lead times of less than one month, but SLP and T2m provide only limited improvement in the predictive skill at lead times of about one to two months (<xref ref-type="fig" rid="f8">
<bold>Figure&#xa0;8A</bold>
</xref>). According to the distribution of RMSE_SIC and bias in September, the improvement of the predictive skill of Ice-kNN-Sflux mainly occurs in the Beaufort Sea, compared with Ice-kNN-PC (<xref ref-type="fig" rid="f3">
<bold>Figures&#xa0;3A</bold>
</xref>, <xref ref-type="fig" rid="f4">
<bold>4G&#x2013;K</bold>
</xref>). For SIE, the sensitivity index is calculated based on the RMSE_SIE. All the sea ice-related variables show improvement of the SIE predictive skill at lead times of less than one month. But for lead times longer than one month, all the sea ice-related variables show negative contributions to the predictive skill of SIE.</p>
<p>The predictive skill of Ice-kNN-Sflux for SIC is significantly better than both the climatological prediction and the anomaly persistence prediction at lead times of longer than two weeks (<xref ref-type="supplementary-material" rid="SM1">
<bold>Figure S7</bold>
</xref>). The predictive skill of Ice-kNN-Sflux for September SIC is significantly better than the anomaly persistence prediction for the whole Arctic, and significantly better than the climatological prediction for the whole Arctic, except for Baffin Bay and the Canadian Islands (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3</bold>
</xref>). The prediction bias of Ice-kNN-Sflux in September SIE is reduced by 2.0 &#xd7; 10<sup>6</sup> km<sup>2</sup> compared with the climatological prediction and by 3.0 &#xd7; 10<sup>6</sup> km<sup>2</sup> compared with the anomaly persistence prediction.</p>
<p>In general, for daily Arctic sea ice forecasts in summer, the Sflux fields, which have a direct relation to sea ice (<xref ref-type="bibr" rid="B17">Liu et&#xa0;al., 2021</xref>), can enhance the predictive skill of sea ice. SLP and T2m show little improvement of the predictive skill of sea ice, which may result from the chaotic behavior of the atmosphere (<xref ref-type="bibr" rid="B23">Mohammadi-Aragh et&#xa0;al., 2018</xref>). Meanwhile, the surface oceanic field SST does not show its long-term memory, which may result from the interpolation bias. Similar results were obtained in <xref ref-type="bibr" rid="B17">Liu et&#xa0;al. (2021)</xref> using the deep learning model ConvLSTM.</p>
</sec>
<sec id="s4_6">
<label>4.6</label>
<title>Comparison of SIE</title>
<p>The Sea Ice Prediction Network (SIPN) is an open platform that has been collecting predictions of Arctic SIE in September from around the world since 2008, then compiling and presenting them to those interested in Arctic sea ice. September SIE predictions have been submitted to the SIPN in June, July, and August since 2008, with an additional September submission added in 2021. There are a variety of prediction methods, including heuristic, statistical, mixed, dynamic, and machine learning/other. To further evaluate the Arctic sea ice forecast skill of the Ice-kNN model, we compared the Arctic September SIEs in 2021 and 2022 using the Ice-kNN-Sflux model with the observations and the contributions for the September SIE predictions to the Post-Season Sea Ice Outlook for 2021 and 2022 (<xref ref-type="bibr" rid="B2">Bhatt et&#xa0;al., 2022a</xref>; <xref ref-type="bibr" rid="B3">Bhatt et&#xa0;al., 2022b</xref>). We utilized the SIC of May 31, June 30, July 31 and August 31, respectively, as the input of the Ice-kNN-Sflux model to predict the September SIEs. It should be noted that here we use a hindcast (not real-time forecast) result of the Ice-kNN-Sflux model.</p>
<p>As shown in <xref ref-type="fig" rid="f9">
<bold>Figure&#xa0;9A</bold>
</xref>, the observed September SIE in 2021 was 4.92 &#xd7; 10<sup>6</sup> km<sup>2</sup> (reported by NSIDC). The median hindcasting result of Ice-kNN-Sflux from June to September is 4.8 &#xd7; 10<sup>6</sup> km<sup>2</sup>, with a quartile range of 4.62 to 5.04 &#xd7; 10<sup>6</sup> km<sup>2</sup> (<xref ref-type="fig" rid="f9">
<bold>Figure&#xa0;9A</bold>
</xref>). The median September estimates based on all contributors of SIPN were 4.37 &#xd7; 10<sup>6</sup>, 4.36 &#xd7; 10<sup>6</sup>, 4.39 &#xd7; 10<sup>6</sup>, and 4.39 &#xd7; 10<sup>6</sup> km<sup>2</sup>, respectively, from June to September. In comparison, our hindcasts using Ice-kNN-Sflux were 5.34 &#xd7; 10<sup>6</sup>, 4.94 &#xd7; 10<sup>6</sup>, 4.66 &#xd7; 10<sup>6</sup>, and 4.49 &#xd7; 10<sup>6</sup> km<sup>2</sup>, respectively (<xref ref-type="supplementary-material" rid="SM1">
<bold>Table S1A</bold>
</xref>). For 2022, the median September estimates of SIPN were 4.57 &#xd7; 10<sup>6</sup>, 4.64 &#xd7; 10<sup>6</sup>, 4.83 &#xd7; 10<sup>6</sup>, and 4.91 &#xd7; 10<sup>6</sup> km<sup>2</sup>, respectively, from June to September, which approach the observation of 4.87 &#xd7; 10<sup>6</sup> km<sup>2</sup> (reported by the NSIDC). The hindcasts of Ice-kNN-Sflux from June to September were 5.05 &#xd7; 10<sup>6</sup>, 4.47 &#xd7; 10<sup>6</sup>, 5.65 &#xd7; 10<sup>6</sup>, and 4.62 &#xd7; 10<sup>6</sup> km<sup>2</sup> (<xref ref-type="supplementary-material" rid="SM1">
<bold>Table S1B</bold>
</xref>). The median hindcasting result of Ice-kNN-Sflux from June to September is 4.835 &#xd7; 10<sup>6</sup> km<sup>2</sup>, with a quartile range of 4.58 to 5.2 &#xd7; 10<sup>6</sup> km<sup>2</sup> (<xref ref-type="fig" rid="f9">
<bold>Figure&#xa0;9B</bold>
</xref>).</p>
<fig id="f9" position="float">
<label>Figure&#xa0;9</label>
<caption>
<p>The SIPN forecast box plots for the estimates of September Arctic SIE in <bold>(A)</bold> 2021 and <bold>(B)</bold> 2022 by ML/Other (M/O), Mixed (M), Dynamic (Dy), Statistical (St) and Heuristic (He). Our model hindcasts of Ice-kNN-Sflux are shown in bold. The data for this figure were adapted from the Sea Ice Prediction Network.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-10-1260047-g009.tif"/>
</fig>
</sec>
</sec>
<sec id="s5" sec-type="conclusions|discussion">
<label>5</label>
<title>Conclusions and discussion</title>
<p>In this study, a SIC dataset of remote sensing was utilized and a machine learning model, Ice-kNN, has been introduced and optimized to improve the prediction skill of summer Arctic SIC for a 122-day prediction. The results show that when the traditional kNN model is directly applied to predict the summer Arctic SIC, its September predictive skill is poorer than the climatological prediction for the whole Arctic, which is due to the inability of the kNN model to identify the seasonal variability of SIC in the summer Arctic. To address this issue, we proposed different processes to improve the performance of the Ice-kNN model, including the data preprocessing of deseasonalization and detrending, a drift-ice correction algorithm, expansion of the training library, a distance function, and predictors. By using these algorithms, we aimed to optimize the results of the Ice-kNN model. Our sensitivity analysis revealed that the seasonality and trends of the data need to be removed during preprocessing to improve the identification of sea ice variability by the Ice-kNN model. Although the traditional kNN model has no spatial relation, the sea ice coverage can be constrained by defining the samples as a pattern of SICA and using the composite distance function combined with a spatial anomaly correlation coefficient and Euclidean distance. In addition, selecting sufficient training labeled samples improves the predictive skill of the Ice-kNN model for Arctic sea ice. Besides, the importance of sea ice-related variables was studied through sensitivity tests. The introduction of Sflux into the Ice-kNN model effectively improved the predictive skill of the model, whereas the addition of SLP, T2m, and SST did not significantly improve the predictive skill.</p>
<p>The Ice-kNN-Sflux model was evaluated against climatological and anomaly persistence predictions. There is notable skill enhancement in the hindcasts of Arctic sea ice using the Ice-kNN-Sflux model, which is more pronounced with increasing lead time. The prediction bias of the September mean SIE in the Ice-kNN-Sflux hindcasts was reduced by about 2.0 &#xd7; 10<sup>6</sup> km<sup>2</sup> and 3.0 &#xd7; 10<sup>6</sup> km<sup>2</sup> compared with the climatological and the anomaly persistence predictions, respectively. In addition, the September SIE was found to be reasonably well predicted compared with the forecasts submitted to the SIPN in 2021 and 2022. Overall, our study provides important insights into predicting summer daily Arctic SIC and highlights the potential benefits of using the modified Ice-kNN model for this purpose.</p>
<p>Although this Ice-kNN model shows great potential for summer daily Arctic sea ice prediction, more experiments need to be conducted to improve the Ice-kNN model and examine its robustness. Future studies are needed to further expand the initial forecast days of the Ice-kNN model. In addition, the combined effects of the predictors mentioned in this study on the Ice-kNN model are not considered and Arctic SIC is also influenced by a variety of other factors, such as ice drift, surface albedo and ocean heat content (<xref ref-type="bibr" rid="B31">Shimada et&#xa0;al., 2006</xref>; <xref ref-type="bibr" rid="B29">Screen and Simmonds, 2010</xref>; <xref ref-type="bibr" rid="B18">Mahajan et&#xa0;al., 2011</xref>; <xref ref-type="bibr" rid="B17">Liu et&#xa0;al., 2021</xref>). Therefore, it is necessary to study different combinations of predictors and include more predictor variables related to sea ice for feature processing to strengthen the understanding of the multivariable processes.</p>
</sec>
<sec id="s6" sec-type="data-availability">
<title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article/<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Material</bold>
</xref>. Further inquiries can be directed to the corresponding author.</p>
</sec>
<sec id="s7" sec-type="author-contributions">
<title>Author contributions</title>
<p>YL: Conceptualization, Data curation, Formal Analysis, Investigation, Methodology, Software, Validation, Visualization, Writing &#x2013; original draft, Writing &#x2013; review and editing. QY: Conceptualization, Funding acquisition, Project administration, Resources, Supervision, Writing &#x2013; review and editing. XL: Conceptualization, Investigation, Methodology, Resources, Supervision, Validation, Writing &#x2013; review and editing. CY: Conceptualization, Supervision, Writing &#x2013; review and editing. YW: Writing &#x2013; review and editing, Supervision. JW: Writing &#x2013; review and editing, Supervision. JinL: Writing &#x2013; review and editing, Conceptualization, Data curation, Investigation. SC: Writing &#x2013; review and editing, Data curation, Investigation. JipL: Supervision, Writing &#x2013; review and editing.</p>
</sec>
</body>
<back>
<sec id="s8" sec-type="funding-information">
<title>Funding</title>
<p>The author(s) declare financial support was received for the research, authorship, and/or publication of this article. This work was supported by the Southern Marine Science and Engineering Guangdong Laboratory (Zhuhai) (No. SML2020sp007), the Guangdong Basic and Applied Basic Research Foundation (No. 2020B1515020025), the National Key R&amp;D Program of China (No. 2022YFE0106300), the National Natural Science Foundation of China (Nos. 42106233, 42106226, 41922044) and the fundamental research funds for the Norges Forskningsr&#xe5;d (No. 328886).</p>
</sec>
<sec id="s9" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s10" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s11" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fmars.2023.1260047/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fmars.2023.1260047/full#supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="Presentation_1.pdf" id="SM1" mimetype="application/pdf"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Andersson</surname> <given-names>T. R.</given-names>
</name>
<name>
<surname>Hosking</surname> <given-names>J. S.</given-names>
</name>
<name>
<surname>P&#xe9;rez-Ortiz</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Paige</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Elliott</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Russell</surname> <given-names>C.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Seasonal Arctic sea ice forecasting with probabilistic deep learning</article-title>. <source>Nat. Commun.</source> <volume>12</volume> (<issue>1</issue>), <fpage>1</fpage>&#x2013;<lpage>12</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41467-021-25257-4</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="web">
<person-group person-group-type="author">
<name>
<surname>Bhatt</surname> <given-names>U. S.</given-names>
</name>
<name>
<surname>Bieniek</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Bitz</surname> <given-names>C. M.</given-names>
</name>
<name>
<surname>Blanchard-Wrigglesworth</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Eicken</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Fisher</surname> <given-names>H. M.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>a) <source>2021 sea ice outlook post-season report</source>. Available at: <uri xlink:href="https://www.arcus.org/sipn/sea-ice-outlook/2021/post-season">https://www.arcus.org/sipn/sea-ice-outlook/2021/post-season</uri>.</citation>
</ref>
<ref id="B3">
<citation citation-type="web">
<person-group person-group-type="author">
<name>
<surname>Bhatt</surname> <given-names>U. S.</given-names>
</name>
<name>
<surname>Meier</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Blanchard-Wrigglesworth</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Massonnet</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Goessling</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Ludwig</surname> <given-names>V.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>b) <source>Sea ice outlook: 2022 post season report</source>. Available at: <uri xlink:href="https://www.arcus.org/sipn/sea-ice-outlook/2022/post-season">https://www.arcus.org/sipn/sea-ice-outlook/2022/post-season</uri>.</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Kang</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>C.</given-names>
</name>
<name>
<surname>You</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Du</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>M.</given-names>
</name>
<etal/>
</person-group>. (<year>2020</year>). <article-title>Changes in sea ice and future accessibility along the Arctic Northeast Passage</article-title>. <source>Glob. Planet. Change</source> <volume>195</volume>, <elocation-id>103319</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.gloplacha.2020.103319</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chi</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Bae</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Kwon</surname> <given-names>Y. J.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Two-stream convolutional long- and short-term memory model using perceptual loss for sequence-to-sequence arctic sea ice prediction</article-title>. <source>Remote Sens.</source> <volume>13</volume> (<issue>17</issue>), <elocation-id>3413</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/rs13173413</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chi</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Kim</surname> <given-names>H. C.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Prediction of Arctic sea ice concentration using a fully data driven deep neural network</article-title>. <source>Remote Sens.</source> <volume>9</volume> (<issue>12</issue>), <elocation-id>1305</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/rs9121305</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Deng</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Zhu</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Cheng</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Zong</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>S.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Efficient kNN classification algorithm for big data</article-title>. <source>Neurocomputing</source> <volume>195</volume>, <fpage>143</fpage>&#x2013;<lpage>148</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.neucom.2015.08.112</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fritzner</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Graversen</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Christensen</surname> <given-names>K. H.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Assessment of high-resolution dynamical and machine learning models for prediction of sea ice concentration in a regional application</article-title>. <source>J. Geophys. Res. Ocean.</source> <volume>125</volume> (<issue>11</issue>), <fpage>1</fpage>&#x2013;<lpage>23</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1029/2020JC016277</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Guemas</surname> <given-names>V.</given-names>
</name>
<name>
<surname>Blanchard-Wrigglesworth</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Chevallier</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Day</surname> <given-names>J. J.</given-names>
</name>
<name>
<surname>D&#xe9;qu&#xe9;</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Doblas-Reyes</surname> <given-names>F. J.</given-names>
</name>
<etal/>
</person-group>. (<year>2016</year>). <article-title>A review on Arctic sea-ice predictability and prediction on seasonal to decadal time-scales</article-title>. <source>Q. J. R. Meteorol. Soc.</source> <volume>142</volume> (<issue>695</issue>), <fpage>546</fpage>&#x2013;<lpage>561</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/qj.2401</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hersbach</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Bell</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Berrisford</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Hirahara</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Hor&#xe1;nyi</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Mu&#xf1;oz Sabater</surname> <given-names>J.</given-names>
</name>
<etal/>
</person-group>. (<year>2020</year>). <article-title>The ERA5 global reanalysis</article-title>. <source>Q. J. R. Meteorol. Soc.</source> <volume>146</volume> (<issue>730</issue>), <fpage>1999</fpage>&#x2013;<lpage>2049</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/qj.3803</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Huang</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Banzon</surname> <given-names>V.</given-names>
</name>
<name>
<surname>Freeman</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Graham</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Hankins</surname> <given-names>B.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Improvements of the daily optimum interpolation sea surface temperature (DOISST) version 2.1</article-title>. <source>J. Clim.</source> <volume>34</volume> (<issue>8</issue>), <fpage>2923</fpage>&#x2013;<lpage>2939</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1175/JCLI-D-20-0166.1</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jun Kim</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Kim</surname> <given-names>H. C.</given-names>
</name>
<name>
<surname>Han</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Lee</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Im</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Prediction of monthly Arctic sea ice concentrations using satellite and reanalysis data based on convolutional neural networks</article-title>. <source>Cryosphere</source> <volume>14</volume> (<issue>3</issue>), <fpage>1083</fpage>&#x2013;<lpage>1104</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.5194/tc-14-1083-2020</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kwok</surname> <given-names>R.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Arctic sea ice thickness, volume, and multiyear ice coverage: Losses and coupled variability (1958&#x2013;2018)</article-title>. <source>Environ. Res. Lett.</source> <volume>13</volume> (<issue>10</issue>). doi:&#xa0;<pub-id pub-id-type="doi">10.1088/1748-9326/aae3ec</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Bordbar</surname> <given-names>M. H.</given-names>
</name>
<name>
<surname>Latif</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Park</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Harla&#xdf;</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Monthly to seasonal prediction of tropical Atlantic sea surface temperature with statistical models constructed from observations and data from the Kiel Climate Model</article-title>. <source>Clim. Dyn.</source> <volume>54</volume> (<issue>3&#x2013;4</issue>), <fpage>1829</fpage>&#x2013;<lpage>1850</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s00382-020-05140-6</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Yu</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Holland</surname> <given-names>P. R.</given-names>
</name>
<name>
<surname>Min</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Mu</surname> <given-names>L.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>Unprecedented Arctic sea ice thickness loss and multiyear-ice volume export through Fram Strait during 2010-2011</article-title>. <source>Environ. Res. Lett.</source> <volume>17</volume> (<issue>9</issue>), <elocation-id>095008</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1088/1748-9326/ac8be7</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lindsay</surname> <given-names>R. W.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Schweiger</surname> <given-names>A. J.</given-names>
</name>
<name>
<surname>Steele</surname> <given-names>M. A.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>Seasonal predictions of ice extent in the Arctic Ocean</article-title>. <source>J. Geophys. Res. Ocean.</source> <volume>113</volume> (<issue>2</issue>), <fpage>1</fpage>&#x2013;<lpage>11</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1029/2007JC004259</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Bogaardt</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Attema</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Hazeleger</surname> <given-names>W.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Extended-range arctic sea ice forecast with convolutional long short-term memory networks</article-title>. <source>Mon. Weather Rev.</source> <volume>149</volume> (<issue>6</issue>), <fpage>1673</fpage>&#x2013;<lpage>1693</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1175/MWR-D-20-0113.1</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mahajan</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Delworth</surname> <given-names>T. L.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Impact of the atlantic meridional overturning circulation (AMOC) on arctic surface air temperature and sea ice variability</article-title>. <source>J. Clim.</source> <volume>24</volume> (<issue>24</issue>), <fpage>6573</fpage>&#x2013;<lpage>6581</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1175/2011JCLI4002.1</pub-id>
</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Maslanik</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Stroeve</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>1999</year>). &#x201c;<article-title>Near-Real-Time DMSP SSMIS Daily Polar Gridded Sea Ice Concentrations, Version 1</article-title>.&#x201d; <source>NASA Nat. Snow Ice Data Center Distrib. Act. Arch. Center</source>. doi:&#xa0;<pub-id pub-id-type="doi">10.5067/U8C09DWVX9LM</pub-id>
</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Melia</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Haines</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Hawkins</surname> <given-names>E.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Sea ice decline and 21st century trans-Arctic shipping routes</article-title>. <source>Geophys. Res. Lett.</source> <volume>43</volume> (<issue>18</issue>), <fpage>9720</fpage>&#x2013;<lpage>9728</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/2016GL069315</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Melsom</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Palerme</surname> <given-names>C.</given-names>
</name>
<name>
<surname>M&#xfc;ller</surname> <given-names>M.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Validation metrics for ice edge position forecasts</article-title>. <source>Ocean Sci.</source> <volume>15</volume> (<issue>3</issue>), <fpage>615</fpage>&#x2013;<lpage>630</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.5194/os-15-615-2019</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Min</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Zhou</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Shu</surname> <given-names>Q.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>The emerging arctic shipping corridors</article-title>. <source>Geophys. Res. Lett.</source> <volume>49</volume> (<issue>10</issue>), <fpage>1</fpage>&#x2013;<lpage>10</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1029/2022GL099157</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mohammadi-Aragh</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Goessling</surname> <given-names>H. F.</given-names>
</name>
<name>
<surname>Losch</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Hutter</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Jung</surname> <given-names>T.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Predictability of Arctic sea ice on weather time scales</article-title>. <source>Sci. Rep.</source> <volume>8</volume> (<issue>1</issue>), <fpage>1</fpage>&#x2013;<lpage>7</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41598-018-24660-0</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="web">
<person-group person-group-type="author">
<name>
<surname>Mu</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Luo</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Yuan</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Liang</surname> <given-names>X.</given-names>
</name>
</person-group> (<year>2023</year>) <source>IceTFT v1.0.0: interpretable long-term prediction of arctic sea ice extent with deep learning</source> (Accessed <access-date>January, 1&#x2013;28</access-date>).</citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mullan</surname> <given-names>A. B.</given-names>
</name>
<name>
<surname>Thompson</surname> <given-names>C. S.</given-names>
</name>
</person-group> (<year>2006</year>). <article-title>Analogue forecasting of New Zealand climate anomalies</article-title>. <source>Int. J. Climatol.</source> <volume>26</volume> (<issue>4</issue>), <fpage>485</fpage>&#x2013;<lpage>504</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/joc.1261</pub-id>
</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Parkinson</surname> <given-names>C. L.</given-names>
</name>
<name>
<surname>Comiso</surname> <given-names>J. C.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>On the 2012 record low Arctic sea ice cover: Combined impact of preconditioning and an August storm</article-title>. <source>Geophys. Res. Lett.</source> <volume>40</volume> (<issue>7</issue>), <fpage>1356</fpage>&#x2013;<lpage>1361</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/grl.50349</pub-id>
</citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Post</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Bhatt</surname> <given-names>U. S.</given-names>
</name>
<name>
<surname>Bitz</surname> <given-names>C. M.</given-names>
</name>
<name>
<surname>Brodie</surname> <given-names>J. F.</given-names>
</name>
<name>
<surname>Fulton</surname> <given-names>T. L.</given-names>
</name>
<name>
<surname>Hebblewhite</surname> <given-names>M.</given-names>
</name>
<etal/>
</person-group>. (<year>2013</year>). <article-title>Ecological consequences of sea-ice decline</article-title>. <source>Science</source> <volume>341</volume> (<issue>6145</issue>), <fpage>519</fpage>&#x2013;<lpage>524</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1126/science.1235225</pub-id>
</citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Reichstein</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Camps-Valls</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Stevens</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Jung</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Denzler</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Carvalhais</surname> <given-names>N.</given-names>
</name>
<etal/>
</person-group>. (<year>2019</year>). <article-title>Deep learning and process understanding for data-driven Earth system science</article-title>. <source>Nature</source> <volume>566</volume> (<issue>7743</issue>), <fpage>195</fpage>&#x2013;<lpage>204</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41586-019-0912-1</pub-id>
</citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Screen</surname> <given-names>J. A.</given-names>
</name>
<name>
<surname>Simmonds</surname> <given-names>I.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>The central role of diminishing sea ice in recent Arctic temperature amplification</article-title>. <source>Nature</source> <volume>464</volume> (<issue>7293</issue>), <fpage>1334</fpage>&#x2013;<lpage>1337</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nature09051</pub-id>
</citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Serreze</surname> <given-names>M. C.</given-names>
</name>
<name>
<surname>Meier</surname> <given-names>W. N.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>The Arctic&#x2019;s sea ice cover: trends, variability, predictability, and comparisons to the Antarctic</article-title>. <source>Ann. N. Y. Acad. Sci.</source> <volume>1436</volume> (<issue>1</issue>), <fpage>36</fpage>&#x2013;<lpage>53</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/nyas.13856</pub-id>
</citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shimada</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Kamoshida</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Itoh</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Nishino</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Carmack</surname> <given-names>E.</given-names>
</name>
<name>
<surname>McLaughlin</surname> <given-names>F.</given-names>
</name>
<etal/>
</person-group>. (<year>2006</year>). <article-title>Pacific Ocean inflow: Influence on catastrophic reduction of sea ice cover in the Arctic Ocean</article-title>. <source>Geophys. Res. Lett.</source> <volume>33</volume> (<issue>8</issue>), <fpage>3</fpage>&#x2013;<lpage>6</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1029/2005GL025624</pub-id>
</citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Steele</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Ermold</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>Arctic Ocean surface warming trends over the past 100 years</article-title>. <source>Geophys. Res. Lett.</source> <volume>35</volume> (<issue>2</issue>), <fpage>1</fpage>&#x2013;<lpage>6</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1029/2007GL031651</pub-id>
</citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Stroeve</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Notz</surname> <given-names>D.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Changing state of Arctic sea ice across all seasons</article-title>. <source>Environ. Res. Lett.</source> <volume>13</volume> (<issue>10</issue>), <fpage>103001</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1088/1748-9326/aade56</pub-id>
</citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Stroeve</surname> <given-names>J. C.</given-names>
</name>
<name>
<surname>Serreze</surname> <given-names>M. C.</given-names>
</name>
<name>
<surname>Holland</surname> <given-names>M. M.</given-names>
</name>
<name>
<surname>Kay</surname> <given-names>J. E.</given-names>
</name>
<name>
<surname>Malanik</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Barrett</surname> <given-names>A. P.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>The Arctic&#x2019;s rapidly shrinking sea ice cover: A research synthesis</article-title>. <source>Clim. Change</source> <volume>110</volume> (<issue>3&#x2013;4</issue>), <fpage>1005</fpage>&#x2013;<lpage>1027</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s10584-011-0101-1</pub-id>
</citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Thanh Noi</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Kappas</surname> <given-names>M.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Comparison of random forest, k-nearest neighbor, and support vector machine classifiers for land cover classification using Sentinel-2 imagery</article-title>. <source>Sensors</source> <volume>18</volume> (<issue>1</issue>), <elocation-id>18</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/s18010018</pub-id>
</citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Vihma</surname> <given-names>T.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Effects of Arctic sea ice decline on weather and climate: A review</article-title>. <source>Surv. Geophys.</source> <volume>35</volume> (<issue>5</issue>), <fpage>1175</fpage>&#x2013;<lpage>1214</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s10712-014-9284-0</pub-id>
</citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Yuan</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>C.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Subseasonal forecast of Arctic sea ice concentration via statistical approaches</article-title>. <source>Clim. Dyn.</source> <volume>52</volume> (<issue>7&#x2013;8</issue>), <fpage>4953</fpage>&#x2013;<lpage>4971</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s00382-018-4426-6</pub-id>
</citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Yuan</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Ting</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>C.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Predicting summer Arctic sea ice concentration intraseasonal variability using a vector autoregressive model</article-title>. <source>J. Clim.</source> <volume>29</volume> (<issue>4</issue>), <fpage>1529</fpage>&#x2013;<lpage>1543</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1175/JCLI-D-15-0313.1</pub-id>
</citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wei</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Bao</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>He</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Ma</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>M.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Subseasonal to seasonal Arctic sea-ice prediction: A grand challenge of climate science</article-title>. <source>Atmos. Ocean. Sci. Lett.</source> <volume>14</volume> (<issue>4</issue>), <elocation-id>100052</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.aosl.2021.100052</pub-id>
</citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname> <given-names>C. Y.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>S.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Seasonal Arctic sea ice prediction using a newly developed fully coupled regional model with the assimilation of satellite sea ice observations</article-title>. <source>J. Adv. Model. Earth Syst.</source> <volume>12</volume> (<issue>5</issue>), <fpage>1</fpage>&#x2013;<lpage>25</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1029/2019MS001938</pub-id>
</citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yuan</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>W.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Arctic sea ice seasonal prediction by a linear Markov model</article-title>. <source>J. Clim.</source> <volume>29</volume> (<issue>22</issue>), <fpage>8151</fpage>&#x2013;<lpage>8173</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1175/JCLI-D-15-0858.1</pub-id>
</citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Zong</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Zhu</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Cheng</surname> <given-names>D.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Learning k for kNN classification</article-title>. <source>ACM Trans. Intell. Syst. Technol.</source> <volume>8</volume> (<issue>3</issue>), <fpage>43</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1145/2990508</pub-id>
</citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Zong</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Zhu</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>S.</given-names>
</name>
<etal/>
</person-group>. (<year>2018</year>). <article-title>Efficient kNN classification with different numbers of nearest neighbors</article-title>. <source>IEEE Trans. Neural Networks Learn. Syst.</source> <volume>29</volume> (<issue>5</issue>), <fpage>1774</fpage>&#x2013;<lpage>1785</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1109/TNNLS.2017.2673241</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>