<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3-mathml3.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:ali="http://www.niso.org/schemas/ali/1.0/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="1.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Remote Sens.</journal-id>
<journal-title-group>
<journal-title>Frontiers in Remote Sensing</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Remote Sens.</abbrev-journal-title>
</journal-title-group>
<issn pub-type="epub">2673-6187</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">1782148</article-id>
<article-id pub-id-type="doi">10.3389/frsen.2026.1782148</article-id>
<article-version article-version-type="Version of Record" vocab="NISO-RP-8-2008"/>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Original Research</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>Crop type mapping in the pre-Sentinel era using variable-length Landsat time-series and self-supervised learning</article-title>
<alt-title alt-title-type="left-running-head">Wijesingha and Beila</alt-title>
<alt-title alt-title-type="right-running-head">
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3389/frsen.2026.1782148">10.3389/frsen.2026.1782148</ext-link>
</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Wijesingha</surname>
<given-names>Jayan</given-names>
</name>
<xref ref-type="aff" rid="aff1"/>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2403323"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Visualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/visualization/">Visualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal Analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing - original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Beila</surname>
<given-names>Ilze</given-names>
</name>
<xref ref-type="aff" rid="aff1"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x26; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/">Writing - review and editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Project administration" vocab-term-identifier="https://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
</contrib>
</contrib-group>
<aff id="aff1">
<institution>Grassland Science and Renewable Plant Resources, Faculty of Organic Agricultural Sciences, University of Kassel</institution>, <city>Witzenhausen</city>, <country country="DE">Germany</country>
</aff>
<author-notes>
<corresp id="c001">
<label>&#x2a;</label>Correspondence: Jayan Wijesingha, <email xlink:href="mailto:jayan.wijesingha@uni-kassel.de">jayan.wijesingha@uni-kassel.de</email>, <email xlink:href="mailto:gnr@uni-kassel.de">gnr@uni-kassel.de</email>
</corresp>
</author-notes>
<pub-date publication-format="electronic" date-type="pub" iso-8601-date="2026-02-20">
<day>20</day>
<month>02</month>
<year>2026</year>
</pub-date>
<pub-date publication-format="electronic" date-type="collection">
<year>2026</year>
</pub-date>
<volume>7</volume>
<elocation-id>1782148</elocation-id>
<history>
<date date-type="received">
<day>06</day>
<month>01</month>
<year>2026</year>
</date>
<date date-type="rev-recd">
<day>03</day>
<month>02</month>
<year>2026</year>
</date>
<date date-type="accepted">
<day>09</day>
<month>02</month>
<year>2026</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2026 Wijesingha and Beila.</copyright-statement>
<copyright-year>2026</copyright-year>
<copyright-holder>Wijesingha and Beila</copyright-holder>
<license>
<ali:license_ref start_date="2026-02-20">https://creativecommons.org/licenses/by/4.0/</ali:license_ref>
<license-p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</license-p>
</license>
</permissions>
<abstract>
<p>Crop type mapping is crucial for agricultural land cover monitoring and decision-making. State-of-the-art methods developed using recent Sentinel satellite data have already demonstrated their ability to accurately map crop types. However, crop type mapping for the pre-Sentinel era remains challenging due to the limited availability of higher spatial- and temporal-resolution data. This study addresses this knowledge gap by leveraging variable-length Landsat satellite time-series (L-SITS) data in combination with a self-supervised learning model, SITS-BERT, for crop type mapping. This case study, conducted in two German districts, demonstrates the potential of mapping two different crop type levels (CTL1 - 5 and CTL2 - 9 classes) in the pre-Sentinel era. The SITS-BERT model, pre-trained on unlabelled L-SITS data, was fine-tuned on single-year and 3-year datasets and evaluated using past and future years&#x2019; data, compared with the model&#x2019;s training data. The SITS-BERT model achieved overall accuracies of 0.78&#x2013;0.83 and 0.64&#x2013;0.76 for CTL1 and CTL2, respectively, with fine-tuning on single-year data. The model fine-tuned with 3&#xa0;years achieved higher accuracies (0.81&#x2013;0.85 and 0.72&#x2013;0.78). The results showed that the SITS-BERT model finetuned with single-year data outperforms the baseline random forest model trained on single-year fixed-length L-SITS data. The study highlighted that, with this approach, limited number of available SITS observations can still be useful. The findings of this study demonstrated the potential of the SITS-BERT model with L-SITS data for crop-type mapping in the pre-Sentinel era, contributing to a more comprehensive understanding of agricultural land cover dynamics and to the evaluation of agricultural policy impacts.</p>
</abstract>
<kwd-group>
<kwd>crop mapping</kwd>
<kwd>deep learning</kwd>
<kwd>satellite image time-series (SITS)</kwd>
<kwd>SITS-BERT</kwd>
<kwd>transformers</kwd>
</kwd-group>
<funding-group>
<award-group id="gs1">
<funding-source id="sp1">
<institution-wrap>
<institution>Bundesministerium f&#xfc;r Forschung, Technologie und Raumfahrt</institution>
<institution-id institution-id-type="doi" vocab="open-funder-registry" vocab-identifier="10.13039/open_funder_registry">10.13039/501100002347</institution-id>
</institution-wrap>
</funding-source>
<award-id rid="sp1">031B1129A</award-id>
</award-group>
<funding-statement>The author(s) declared that financial support was received for this work and/or its publication. This research was funded by the German Federal Ministry of Research, Technology and Space (BMFTR) within the framework of the SYMOBIO project (grant number 031B1129A).</funding-statement>
</funding-group>
<counts>
<fig-count count="5"/>
<table-count count="5"/>
<equation-count count="0"/>
<ref-count count="27"/>
<page-count count="12"/>
</counts>
<custom-meta-group>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Remote Sensing Time Series Analysis</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="s1">
<label>1</label>
<title>Introduction</title>
<p>Information on agricultural land cover (e.g., crop types, their extent and location) and its changes over time is crucial for well-informed policy making. Particularly, decision-makers designing, implementing and evaluating food security, agriculture, biodiversity, and climate change policies benefit from high quality spatial and temporal agricultural land cover data (<xref ref-type="bibr" rid="B5">Karthikeyan et al., 2020</xref>). Monitoring of policy impacts is crucial to avoid long-term negative effects (e.g., unsustainable practices) and, if necessary, to take appropriate corrective actions.</p>
<p>Earth observation satellite image time-series (SITS) data have been successfully applied in research and practice to detect distinct crop growth patterns and stages, and their spatial distribution. This approach helps to distinguish crop extent at different spatial scales, and crop types at various stages of their phenological cycle (<xref ref-type="bibr" rid="B26">Zeng et al., 2020</xref>). Furthermore, the increasing availability of high spatial and temporal resolution remote sensing (RS) SITS (e.g., from Sentinel or harmonised Sentinel and Landsat satellites), newly developed machine/deep learning models and hardware/software development to compute large geospatial data improved the potential of monitoring agricultural land cover in the present and past (<xref ref-type="bibr" rid="B6">Knorn et al., 2009</xref>; <xref ref-type="bibr" rid="B12">Ofori-Ampofo et al., 2021</xref>; <xref ref-type="bibr" rid="B1">Asam et al., 2022</xref>; <xref ref-type="bibr" rid="B11">Nyborg et al., 2022</xref>). The performance of currently used models strongly depends on the availability of high spatial and temporal resolution SITS data. Most state-of-the-art models employ SITS data from Sentinel 1 and 2, which have been available since 2014. However, to assess long-term policy impacts before 2014, the only available option is to use SITS based on Landsat satellite data. Landsat provides data from 1970 to the present, enabling researchers to access more than 50 years of historical satellite data. However, compared to Sentinel 2, Landsat data has lower spatial resolution (30&#xa0;m vs. 10&#xa0;m) and a lower temporal resolution (16 days instead of 5&#x2013;10 days for Sentinel).</p>
<p>Despite these limitations, researchers have demonstrated that models developed using Landsat SITS (L-SITS) data can map agricultural land cover (<xref ref-type="bibr" rid="B7">Kyere et al., 2019</xref>; <xref ref-type="bibr" rid="B22">Wijesingha et al., 2024</xref>). A random forest (RF) machine learning model trained on L-SITS data achieved 71% overall accuracy in mapping four crop types (grasslands, maize, summer crops, and winter crops) in a region of Germany (<xref ref-type="bibr" rid="B7">Kyere et al., 2019</xref>). Similarly, the same four crop types were mapped using L-SITS data and the convolutional neural network (CNN) model, achieving 90% overall accuracy (<xref ref-type="bibr" rid="B22">Wijesingha et al., 2024</xref>). Both studies used fixed time point observations as model inputs, which might have contributed to reduced accuracy.</p>
<p>Specific fixed time points (e.g., weekly, monthly) are mainly used because SITS data are limited throughout the entire crop growth period, e.g., due to the lack of cloud-free images at the required time intervals. However, most machine models (e.g., RF, CNN) can only handle fixed-length SITS. To use varying-length SITS in the abovementioned models, padding or truncation should be employed, which could alter the original data or remove necessary information (<xref ref-type="bibr" rid="B8">Lee and Shin, 2025</xref>). Alternatively, recent advanced deep learning models with transformers can be applied. These models can use variable-length SITS, avoiding the need for complex fixed-length SITS processing.</p>
<p>Transformers are a type of deep learning model, whichprimarily uses self-attention or scaled dot-product attention mechanisms, and is therefore able to handle sequences of variable lengths (<xref ref-type="bibr" rid="B19">Vaswani et al., 2017</xref>). Transformers were initially introduced for neural machine translation in natural language processing. However, nowadays, due to their multiple advantages, transformers are also employed to solve other modelling problems in computer vision or time-series data processing (<xref ref-type="bibr" rid="B21">Wen et al., 2022</xref>). For example, transformers have been used to solve time-series forecast and SITS classification problems in previously published studies (<xref ref-type="bibr" rid="B20">Voelsen et al., 2024</xref>). Further (<xref ref-type="bibr" rid="B16">Ru&#xdf;wurm and K&#xf6;rner, 2020</xref>), introduced a transformer-based approach that uses Sentinel SITS data and advanced temporal encoding to classify fourteen crop types, including fallow land. Additionally, harmonised Landsat and Sentinel 30&#xa0;m SITS were also employed with transformer-based models to detect land surface phenology (<xref ref-type="bibr" rid="B17">Tran et al., 2025</xref>) and to map the in-season 37 crop type (<xref ref-type="bibr" rid="B27">Zhang et al., 2025</xref>). However, to the best of the authors&#x2019; knowledge, no applications of transformer-based models that exclusively use L-SITS for agricultural land cover mapping have been reported.</p>
<p>Labelled data availability is another common challenge in such models. Since deep learning models with transformers are commonly supervised models, to obtain good results, they usually require large amounts of data (<xref ref-type="bibr" rid="B14">Persello et al., 2022</xref>). Self-supervised learning (SSL) is another recently emerged method that can learn from unlabelled data and therefore successfully tackle the issue of scarce training data (<xref ref-type="bibr" rid="B2">Chaves et al., 2020</xref>; <xref ref-type="bibr" rid="B9">Miller et al., 2024</xref>). The standard SSL process involves two main stages: pretraining and fine-tuning. During pretraining, models acquire initial representations by solving a predefined pretext task. In the fine-tuning stage, these representations are refined for a specific downstream task through supervised training on task-related data. This approach allows deep learning models to transfer general knowledge from large-scale, unlabelled data to tasks with limited labelled data, thereby improving their generalisation ability and reducing the risk of overfitting. The successful application of SSL methods with transformers to Sentinel SITS data has already been reported by (<xref ref-type="bibr" rid="B25">Yuan and Lin, 2021</xref>; <xref ref-type="bibr" rid="B24">Xu et al., 2024</xref>).</p>
<p>Despite promising results, the SITS-based agricultural land cover mapping still has limitations in terms of model transferability across different temporal (e.g., years) and spatial (e.g., other regions) domains, as well as across spatial-temporal domains. The recent study by the authors assessed changes in model performance during transfer across different temporal and spatio-temporal domains (<xref ref-type="bibr" rid="B22">Wijesingha et al., 2024</xref>). L-SITS data for mapping of four crop types (grassland, maize, summer crops and winter crops) were used. Results showed that model performance decreased when the trained model was transferred to another temporal domain, and the performance was further reduced during spatial and spatio-temporal transfer. To overcome this problem, multi-year or multi-location data can be used for model training. It enables the model to understand multiple data distributions. In addition, a recent study showed that a transformer-based deep learning model with an advanced temporal encoding method could accurately transfer models trained with single-year data to another year (i.e., temporal transferability) (<xref ref-type="bibr" rid="B15">Pham et al., 2024</xref>). In that study, harmonised Landsat and Sentinel 2 SITS were used. The study employed high density SITS using currently available satellite data. This approach, however, does not solve the identified issues of L-SITS data models.</p>
<p>In light of these challenges, this study addresses the following research question: Can L-SITS data and recently developed transformer-based models using SSL methods effectively map crop types, thereby contributing to agricultural land cover mapping efforts in pre-Sentinel era periods (before 2014)? To answer this question, this work aims to;<list list-type="order">
<list-item>
<p>Develop a crop type mapping SSL model with L-SITS data</p>
</list-item>
<list-item>
<p>Compare model performance using variable-length L-SITS data versus fixed-length SITS data</p>
</list-item>
<list-item>
<p>Investigate how the temporal transferability of these models changes by using different training data (single year versus multi-year training data)</p>
</list-item>
</list>
</p>
</sec>
<sec sec-type="materials|methods" id="s2">
<label>2</label>
<title>Materials and methods</title>
<sec id="s2-1">
<label>2.1</label>
<title>Study area</title>
<p>This study was conducted in two districts of the Weser-Ems region in the federal state of Lower Saxony in Germany (see <xref ref-type="fig" rid="F1">Figure 1</xref>). The two selected districts are: a) Ammerland (DE496) and b) Vechta (DE49F). The Ammerland district is located in the northwestern part of the Weser-Ems region and covers an area of approximately 73,064&#xa0;km<sup>2</sup>. In 2019, the total agricultural area in Ammerland was 41,593&#xa0;km<sup>2</sup>, which accounts for 57% of the district&#x2019;s total area. More than 55% of the agricultural area in this district is covered by grassland, primarily used as forage for dairy cattle. The Vechta district is located in the western part of the Weser-Ems region and covers an area of 81,422&#xa0;km<sup>2</sup>. Similar to Ammerland, about 59% of Vechta&#x2019;s area is dedicated to agriculture. However, in Vechta, the share of grassland area was lower (11%) than in Ammerland. The most dominant crop types in Vechta were maize and winter cereals.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>
<bold>(a)</bold> Location of study area in Germany with German federal state boundaries and Corine land cover classes for the year 2018 (<xref ref-type="bibr" rid="B3">CLC Service, 2023</xref>) for <bold>(b)</bold> Ammerland and <bold>(c)</bold> Vechta districts.</p>
</caption>
<graphic xlink:href="frsen-07-1782148-g001.tif">
<alt-text content-type="machine-generated">Three-panel figure showing land cover in Germany. Panel a maps Germany&#x2019;s major cities and highlights two study areas in red. Panels b and c display detailed land cover categories for these study areas, using colors to indicate features such as sealed areas, forest cover, vegetation, and water. A color legend clarifies each land cover type.</alt-text>
</graphic>
</fig>
</sec>
<sec id="s2-2">
<label>2.2</label>
<title>Data</title>
<sec id="s2-2-1">
<label>2.2.1</label>
<title>Crop field data</title>
<p>The polygons of the crop field boundary and the crop type for each field were obtained from integrated administration and control system (IACS) data from the Ministry of Food, Agriculture and Consumer Protection of Lower Saxony between 2010 and 2018 for the whole Weser-Ems region. Due to heterogeneous crop types data (more than 200 crop types were recorded), this study grouped the types of crops into two different levels: a) crop type level 1 (CTL1) - basic types, and b) crop type level 2 (CTL2) - advanced level. In CTL1, all crop types were categorised into four major categories: permanent grassland, summer crops, winter crops, and others. Nine crop types were considered in the crop type level 2 (CTL2). The summary of the crop type levels categorisation is tabulated in <xref ref-type="table" rid="T1">Table 1</xref>.</p>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>Crop type classification for both crop type levels (CTL1 and CTL2).</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Crop type level 1 (CTL1)</th>
<th align="left">Crop type level 2 (CTL2)</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">C1 &#x2013; Permanent grassland</td>
<td align="left">C11 &#x2013; Permanent grassland (pastures, meadows)</td>
</tr>
<tr>
<td rowspan="2" align="left">C2 &#x2013; Summer crop</td>
<td align="left">C21 &#x2013; Maize (grain, silage)</td>
</tr>
<tr>
<td align="left">C22 &#x2013; Summer cereal (barley, wheat)</td>
</tr>
<tr>
<td rowspan="2" align="left">C3 &#x2013; Winter crop</td>
<td align="left">C31 &#x2013; Winter wheat</td>
</tr>
<tr>
<td align="left">C32 &#x2013; Winter cereal (barley, rye)</td>
</tr>
<tr>
<td rowspan="4" align="left">C4 &#x2013; Other</td>
<td align="left">C41 &#x2013; Oil seed (rapeseed, sunflower)</td>
</tr>
<tr>
<td align="left">C42 &#x2013; Permanent crop (orchard)</td>
</tr>
<tr>
<td align="left">C43 &#x2013; Root crop/vegetables (carrot, potato)</td>
</tr>
<tr>
<td align="left">C44 &#x2013; Mixed (field fodder, quiescence)</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s2-2-2">
<label>2.2.2</label>
<title>Landsat satellite image time-series (L-SITS)</title>
<p>L-SITS data (<xref ref-type="bibr" rid="B18">U.S. Geological Survey, 2025</xref>) from 2010, 2011 and 2013 to 2018 for the two districts were acquired and pre-processed using the Google Earth Engine&#x2019;s Python API (<xref ref-type="bibr" rid="B4">Gorelick et al., 2017</xref>; <xref ref-type="bibr" rid="B23">Wu, 2020</xref>; <xref ref-type="bibr" rid="B10">Montero, 2021</xref>). Data for 2012 could not be obtained due to extensive cloud cover in the satellite images, and 2012 was excluded from further assessment. Each annual L-SITS contained all available images (from Landsat 5, 7, and 8 satellites) between March (01.03) and October (31.10). Even though there are differences between spectral responses for each corresponding band from three Landsat satellites, the Collection-2 Level-2 surface reflectance data were downloaded which systematically corrected to minimise these variations (Landsat images courtesy of the U.S. Geological Survey). Following the methodologies by (<xref ref-type="bibr" rid="B22">Wijesingha et al., 2024</xref>), from each image data (after cloud masking and scaling) of six spectral bands (blue, green, red, near-infrared1, shortwave-infrared1, and B7:shortwave-infrared2) and four vegetation indices (VIs) (normalised vegetation index&#x2013;NDVI, enhanced vegetation index&#x2013;EVI, optimised soil-adjusted vegetation index&#x2013;OSAVI, and normalised difference moisture index&#x2013;NDMI) were considered and extracted (equations for Vis are mentioned in the <xref ref-type="sec" rid="s12">Supplementary Material</xref>). The size of the crop fields was calculated based on the crop field boundaries. Crop fields with a size less than 0.9&#xa0;ha (less than 10 Landsat pixels) were excluded from the study. The mean band reflectance or VI value for each crop field polygon was extracted. For each crop field polygon, the extracted L-SITS data included a time-series of all available time points, Landsat reflectance bands, VI data, and the image acquisition date.</p>
</sec>
</sec>
<sec id="s2-3">
<label>2.3</label>
<title>Models</title>
<sec id="s2-3-1">
<label>2.3.1</label>
<title>Self-supervised learning (SSL) model</title>
<p>This study employed the SSL deep learning model previously developed by (<xref ref-type="bibr" rid="B25">Yuan and Lin, 2021</xref>), which was already utilised for land use, land cover, and crop type mapping using Sentinel SITS. In this model, variable-length SITS data with its time point are inserted as a one-dimensional array. First, the model was pre-trained with available SITS data without using any labels. Then, the pre-trained model was finetuned with available labels. During pre-training, the model learned specific spectral-temporal features of the SITS data, which enabled it to perform downstream tasks accurately with few labels. The model was an extension of bidirectional encoder representations from transformers (BERT), a remarkable SSL model in natural language processing (NLP). The modified BERT model to classify the SITS data was referred to as the SITS-BERT model (<xref ref-type="bibr" rid="B25">Yuan and Lin, 2021</xref>). The whole network consisted of two parts: a) an observation embedding layer and b) a standard transformer encoder. The observation embedding layer contained observations with the corresponding time encoded using positional encoding. The time information was provided as day of the year (DoY) to facilitate model transferability across multiple years. The transformer encoder comprises various stacked transformer blocks. A single transformer block consisted of a multi-head attention layer and a position-wise fully connected feed-forward network. More details about SITS-BERT can be found in the original article by (<xref ref-type="bibr" rid="B25">Yuan and Lin, 2021</xref>).</p>
<p>Pre-training of the SITS-BERT model was designed to do a predesigned pretext task: &#x201c;some of the input observations are randomly chosen and added with noise, and then the model is forced to predict&#x201d; (<xref ref-type="bibr" rid="B25">Yuan and Lin, 2021</xref>). The model can learn temporal connections between observations by solving this pretext task. According to the authors of the original SITS-BERT publication, the model was pre-trained to reconstruct the original, uncorrupted values of perturbed data using SITS, leveraging contextual information from the remaining sequence. During pre-training, the model optimisation objective was the mean-squared error between the predicted value of the corrupted data and its corresponding actual value. The SITS-BERT model in this study was pre-trained using only variable-length L-SITS data (6 bands and 4 VIs) and with respective DoY from 5&#xa0;years (2011, 2013, 2014, 2016, and 2017). The model pre-training was done according to the given configuration (max length &#x3d; 64, number of features &#x3d; 10, validation rate &#x3d; 3%, batch size &#x3d; 256, number of attention heads &#x3d; 8, learning rate &#x3d; 0.0001) (<xref ref-type="bibr" rid="B25">Yuan and Lin, 2021</xref>). After pretraining, the model was fine-tuned for the time-series classification task&#x2014;a process commonly referred to as fine-tuning. To do so, an additional output layer was added to the model. The original model was imported from the <ext-link ext-link-type="uri" xlink:href="https://github.com/linlei1214/SITS-BERT">https://github.com/linlei1214/SITS-BERT</ext-link>.</p>
</sec>
<sec id="s2-3-2">
<label>2.3.2</label>
<title>Random forest (RF) model</title>
<p>The RF model served as the baseline model in this study to compare the performance of the SITS-BERT model. The RF models have been widely employed for crop type classification using SITS data and evaluated for their spatial and temporal transferability (<xref ref-type="bibr" rid="B13">Orynbaikyzy et al., 2022</xref>; <xref ref-type="bibr" rid="B22">Wijesingha et al., 2024</xref>). However, as a shallow/traditional machine learning model, the RF model requires fixed-length time-series data as input. Following the methods explained by (<xref ref-type="bibr" rid="B22">Wijesingha et al., 2024</xref>), the variable-length L-SITS data were converted to the fixed-length time-series by calculating median values for each bi-month (four observations per time-series&#x2013;March-April, May-June, July-August, and September-October). Each L-SITS consisted of 40 observations (10 VIs or spectral bands &#xd7; 4 time points). The mean NDVI bi-monthly time-series for CTL2 crops are shown in <xref ref-type="sec" rid="s12">Supplementary Appendix Figure A1</xref> of the <xref ref-type="sec" rid="s12">Supplementary Material</xref> as an example.</p>
</sec>
</sec>
<sec id="s2-4">
<label>2.4</label>
<title>Model experiments</title>
<p>This study conducted several experiments to understand the influence of the amount of training data and the temporal transferability of the trained model over various years. Considering the training data, two experiment cases were carried out: a) Case I&#x2013;models were trained using only single-year L-SITS data (2015 data), and b) Case II&#x2013;models were trained with multi-year L-SITS data (2014, 2015, and 2016). Regarding the trained models&#x2019; temporal transferability, two transferability scenarios were evaluated: a) Scenario I&#x2013;trained models were tested with the L-SITS data from 2010 to 2011, and b) Scenario II&#x2013;trained models were tested with the L-SITS data from 2017 to 2018. In Scenario I, the model transferability over the past years was tested, and in Scenario II, the model transferability for future years was checked.</p>
<p>The SITS-BERT and baseline RF models were evaluated for all defined experiment cases and model transferability scenarios. However, due to the rebuilding of fixed-length L-SITS data from variable-length L-SITS data, the number of data points and time-series observations used in the model and test data differed between the RF and SITS-BERT models (<xref ref-type="table" rid="T2">Table 2</xref>), as data for some fixed time points were unavailable.</p>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>The size of training and testing data sets (number of data points) in two different models.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">Model</th>
<th align="center">Training data &#x2013; Case I</th>
<th align="center">Training data &#x2013; Case II</th>
<th align="center">Test data &#x2013; Scenario I</th>
<th align="center">Test data &#x2013; Scenario II</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">SITS-BERT</td>
<td align="center">28,176</td>
<td align="center">84,139</td>
<td align="center">57,458</td>
<td align="center">54,923</td>
</tr>
<tr>
<td align="center">RF</td>
<td align="center">24,076</td>
<td align="center">79,799</td>
<td align="center">56,610</td>
<td align="center">52,217</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>Each experiment case (Case I and II) with model transferability scenarios (Scenario I and II) was evaluated by computing a confusion matrix using predicted and actual values for both class levels (CTL1 and CTL2). Based on the confusion matrix, four model performance evaluation metrics (<xref ref-type="table" rid="T3">Table 3</xref>) were derived: OA- overall accuracy (Equation 1), Pr - precision (Equation 2), Rc - recall (Equation 3, and F1 - F1-score (Equation 4). The Pr, Rc, and F1 were calculated at the class level. Due to uneven class distribution, each class-level metric (Pr, Rc, and F1) was summarised by calculating a weighted average, with the number of samples per class as the weight. Because the test data had different numbers of observations across the two models, the comparison was based on a similar number of observations from the RF model. That means a model comparison was based on 56,610 observations in Scenario I and 52,217 observations in Scenario II. However, to get an indication of the SITS-BERT model transferability, model performance metrics for the remaining observations were also computed. To do this, SITS-BERT model performances were calculated based on 848 samples and 2,706 samples for Scenarios I and II, respectively. Finally, to understand the SITS-BERT model performance behaviour with varying numbers of time-series observations, the OA values were summarised for each scenario based on the number of time-series observations per sample.</p>
<table-wrap id="T3" position="float">
<label>TABLE 3</label>
<caption>
<p>Equations and descriptions of the evaluation metrics. (Where <inline-formula id="inf1">
<mml:math id="m1">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mi>P</mml:mi>
</mml:mrow>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is the number of true positives, <inline-formula id="inf2">
<mml:math id="m2">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>F</mml:mi>
<mml:mi>P</mml:mi>
</mml:mrow>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is the number of false positives, <inline-formula id="inf3">
<mml:math id="m3">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>F</mml:mi>
<mml:mi>N</mml:mi>
</mml:mrow>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is the number of false negatives for the class <inline-formula id="inf4">
<mml:math id="m4">
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> respectively, and <inline-formula id="inf5">
<mml:math id="m5">
<mml:mrow>
<mml:mi>n</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> is the number of classes).</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">Metric</th>
<th align="center">Equation</th>
<th align="center">Description</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">Overall accuracy (OA)</td>
<td align="center">
<inline-formula id="inf6">
<mml:math id="m6">
<mml:mrow>
<mml:mi>O</mml:mi>
<mml:mi>A</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>I</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>n</mml:mi>
</mml:msubsup>
<mml:msub>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mi>P</mml:mi>
</mml:mrow>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>l</mml:mi>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mi>S</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>m</mml:mi>
<mml:mi>p</mml:mi>
<mml:mi>l</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>s</mml:mi>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</inline-formula> &#x2009;(1)</td>
<td align="center">The proportion of correctly classified samples among all tested samples</td>
</tr>
<tr>
<td align="center">Precision (Pr)</td>
<td align="center">
<inline-formula id="inf7">
<mml:math id="m7">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="italic">Pr</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:msub>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mi>P</mml:mi>
</mml:mrow>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mi>P</mml:mi>
</mml:mrow>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x2b;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>F</mml:mi>
<mml:mi>P</mml:mi>
</mml:mrow>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</inline-formula> &#x2009;(2)</td>
<td align="center">In each class, the proportion of predicted positives that were positive</td>
</tr>
<tr>
<td align="center">Recall (Rc)</td>
<td align="center">
<inline-formula id="inf8">
<mml:math id="m8">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>R</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:msub>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mi>P</mml:mi>
</mml:mrow>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mi>P</mml:mi>
</mml:mrow>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x2b;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>F</mml:mi>
<mml:mi>N</mml:mi>
</mml:mrow>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</inline-formula> &#x2009;(3)</td>
<td align="center">In each class, the proportion of actual positives that were correctly predicted</td>
</tr>
<tr>
<td align="center">F1 score (F1)</td>
<td align="center">
<inline-formula id="inf9">
<mml:math id="m9">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>F</mml:mi>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>2</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>Pr</mml:mi>
<mml:mo>&#xd7;</mml:mo>
<mml:mi>R</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>Pr</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:mi>R</mml:mi>
<mml:mi>c</mml:mi>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</inline-formula> &#x2009;(4)</td>
<td align="center">The harmonic mean of precision and recall</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>To understand the variations in SITS-BERT model predictions with respect to the number of L-SITS observations, the percentage of accurately predicted data points was calculated for each observation group per CTL type and scenario. The SITS-BERT model experimental results notebooks are at <ext-link ext-link-type="uri" xlink:href="https://github.com/jmatics/L-SITS-BERT/tree/master/LSITS">https://github.com/jmatics/L-SITS-BERT/tree/master/LSITS</ext-link>.</p>
</sec>
</sec>
<sec sec-type="results" id="s3">
<label>3</label>
<title>Results</title>
<sec id="s3-1">
<label>3.1</label>
<title>Crop type distribution</title>
<p>The median number of crop fields per year from the two districts was 27,482. The lowest number of crop fields was in 2015 (24,076), and the highest was in 2010 (28,939). However, the distribution of crop classes varied between the two regions, whereas the frequency of crop types within the same region over the years did not show substantial variation (<xref ref-type="fig" rid="F2">Figure 2</xref>). About 50% of the crop fields in Ammerland were permanent grasslands (C11). Compared to Ammerland, the share of permanent grassland fields in Vectha was only 13%. Maize (C21) was the most dominant crop type in Vechta, at about 40%, and in Ammerland at 28%. About 13% of crop fields in Vechta were winter wheat (C31), and another 20% of fields were other winter cereals (C32). However, the proportion of winter wheat (C31) and winter cereals (C32) in Ammerland was 1% and 5%, respectively. The share of oilseed crop fields (C41) was 0.4% and 1.3% in Ammerland and Vechta, respectively. About 4% of crop fields in Ammerland were permanent crops (C42), and root crops and vegetables (C43) - in Vectha. In both districts, the crop type group &#x201c;mixed&#x201d; (C44) showed varying proportions of crop fields across years.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>Crop type distribution in two districts between 2010 and 2018 (except 2012).</p>
</caption>
<graphic xlink:href="frsen-07-1782148-g002.tif">
<alt-text content-type="machine-generated">Stacked bar chart comparing yearly ratios of different crop parcel types from 2010 to 2018 in Ammerland and Vechta regions, with maize and permanent grassland dominant in Ammerland, and maize, winter cereals, and wheat more prominent in Vechta.</alt-text>
</graphic>
</fig>
</sec>
<sec id="s3-2">
<label>3.2</label>
<title>SITS-BERT model pretraining</title>
<p>The SITS-BERT model was pre-trained on all L-SITS and DoY data from 5&#xa0;years without crop type label data. The model was pre-trained for 50 epochs. The best model was obtained at the 49th epoch and was used for the downstream tasks. The mean square error loss for the best model training was 0.01639; for the validation, it was 0.01356.</p>
</sec>
<sec id="s3-3">
<label>3.3</label>
<title>Variable-length Landsat SITS</title>
<sec id="s3-3-1">
<label>3.3.1</label>
<title>Training data (Case I and Case II)</title>
<p>The pretrained SITS-BERT models were finetuned under two Case experiments. Under Case I, the models were trained using single-year data, whereas Case II employed data from three consecutive years (2014, 2015, and 2016). The training data from Case I contained 28,176 observations, and they had variable-length data with five to fifteen observations (<xref ref-type="fig" rid="F3">Figure 3</xref>). Most of the data points (about 31%) contained 9 observations each. The data with 10 and 8 observations were 24% and 19%, respectively. The minimum number of data points was either 5 or 15 (0.1%). Compared to Case I, 3&#xa0;years of data from Case II contained from five to 25 observations (<xref ref-type="fig" rid="F3">Figure 3</xref>). The total number of training data in Case II was 84,139, with 28,278 from 2014, 28,176 from 2015, to 27,685 from 2016. Of all the training data, 14% each contained 10 and 11 observations. Notably, the data from 2015 to 2016 only had observations between 5 and 15. Conversely, the 2014 data consisted of observations ranging from 10 to 25.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>The distribution of the number of Landsat observations in the variable-length satellite time-series for the model fine-tuning cases: <bold>(a)</bold> Case I - using a single year (2015) data only, and <bold>(b)</bold> Case II - using 3&#xa0;years (2014, 2015, and 2016) data.</p>
</caption>
<graphic xlink:href="frsen-07-1782148-g003.tif">
<alt-text content-type="machine-generated">Two side-by-side bar charts compare training data distributions. Chart A for Case I shows a unimodal distribution peaking at around ten observations, while chart B for Case II displays a bimodal distribution with peaks near twelve and twenty observations. Both charts label the x-axis as number of observations and the y-axis as frequency.</alt-text>
</graphic>
</fig>
</sec>
<sec id="s3-3-2">
<label>3.3.2</label>
<title>Test data (Scenario I and Scenario II)</title>
<p>Similar to the training data distribution under Cases I and II, the test data distribution in Scenarios I and II also differed (<xref ref-type="fig" rid="F4">Figure 4</xref>). In Scenario I, the SITS-BERT model was evaluated using data from 2010 to 2011, comprising 57,458 data points. These data ranged from 6 to 16 observations. Data points with 13 observations were the most frequent, accounting for approximately 25% (8,253 in 2010 and 5,895 in 2011). The 2017 and 2018 data were used in Scenario II for model evaluation, comprising 54,923 data points. Those data points contained observations ranging from three to 24. However, the dataset had 11 and 18 observations, which were the most common, comprising 22% of the data points (11% each from the 11 and 18 observations).</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>The distribution of the number of Landsat observations in the variable-length satellite time-series for testing <bold>(a)</bold> Scenario I (2010 and 2011) and <bold>(b)</bold> Scenario II (2017 and 2018).</p>
</caption>
<graphic xlink:href="frsen-07-1782148-g004.tif">
<alt-text content-type="machine-generated">Bar chart comparing two scenarios labeled Scenario I and Scenario II under the heading Test Data. Scenario I shows a single-peaked distribution centered near twelve, while Scenario II displays a bimodal distribution with peaks near eleven and nineteen. Both plots use frequency as the y-axis and number of observations as the x-axis.</alt-text>
</graphic>
</fig>
</sec>
</sec>
<sec id="s3-4">
<label>3.4</label>
<title>Models trained with single-year data (Case I)</title>
<p>During the Case I experiments, both pretrained SITS-BERT and the RF models were trained on single-year data (2015), and the models were transferred to predict values (both CTL1 and CTL2) in two scenarios (Scenario I and II).</p>
<p>In both Scenarios, the SITS-BERT model under Case I with CTL1 outperformed the RF model in all evaluation metrics (<xref ref-type="table" rid="T4">Table 4</xref>). The SITS-BERT model&#x2019;s OA and weighted F1 score in Scenario I (0.833 and 0.826) were better than in Scenario II (0.784 and 0.785). A similar pattern of accuracy metrics was observed in the RF model, with slightly lower values: weighted F1 was 0.764 (OA &#x3d; 0.752) and 0.740 (OA &#x3d; 0.724) for Scenarios I and II, respectively. The SITS-BERT model performance was also calculated for the remaining observations, as the two models were compared with a similar number of observations. Based on the remaining observations, the SITS-BERT model achieved OA of 0.742 and weighted F1 of 0.718 for CTL1 in Scenario I. Under Scenario II, the remaining observations with the SITS-BERT model achieved an OA of 0.730 and a weighted F1 of 0.724.</p>
<table-wrap id="T4" position="float">
<label>TABLE 4</label>
<caption>
<p>Model performance summary for Case I (fine-tuned with single year data). Bold text highlights the best performance for each Scenario and crop type level.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Class levels</th>
<th align="left">Scenario levels</th>
<th align="left">Model</th>
<th align="center">OA</th>
<th align="center">Weighted precision</th>
<th align="center">Weighted recall</th>
<th align="center">Weighted F1</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td rowspan="6" align="left">CTL1</td>
<td rowspan="3" align="left">Scenario I</td>
<td align="left">SITS-BERT</td>
<td align="center">
<bold>0.833</bold>
</td>
<td align="center">
<bold>0.825</bold>
</td>
<td align="center">
<bold>0.833</bold>
</td>
<td align="center">
<bold>0.826</bold>
</td>
</tr>
<tr>
<td align="left">RF</td>
<td align="center">0.752</td>
<td align="center">0.804</td>
<td align="center">0.752</td>
<td align="center">0.764</td>
</tr>
<tr>
<td align="left">SITS-BERT (remaining)</td>
<td align="center">0.742</td>
<td align="center">0.724</td>
<td align="center">0.742</td>
<td align="center">0.718</td>
</tr>
<tr>
<td rowspan="3" align="left">Scenario II</td>
<td align="left">SITS-BERT</td>
<td align="center">
<bold>0.784</bold>
</td>
<td align="center">
<bold>0.810</bold>
</td>
<td align="center">
<bold>0.784</bold>
</td>
<td align="center">
<bold>0.785</bold>
</td>
</tr>
<tr>
<td align="left">RF</td>
<td align="center">0.724</td>
<td align="center">0.802</td>
<td align="center">0.724</td>
<td align="center">0.740</td>
</tr>
<tr>
<td align="left">SITS-BERT (remaining)</td>
<td align="center">0.730</td>
<td align="center">0.750</td>
<td align="center">0.730</td>
<td align="center">0.724</td>
</tr>
<tr>
<td rowspan="6" align="left">CTL2</td>
<td rowspan="3" align="left">Scenario I</td>
<td align="left">SITS-BERT</td>
<td align="center">
<bold>0.759</bold>
</td>
<td align="center">
<bold>0.753</bold>
</td>
<td align="center">
<bold>0.759</bold>
</td>
<td align="center">
<bold>0.739</bold>
</td>
</tr>
<tr>
<td align="left">RF</td>
<td align="center">0.702</td>
<td align="center">
<bold>0.757</bold>
</td>
<td align="center">0.702</td>
<td align="center">0.704</td>
</tr>
<tr>
<td align="left">SITS-BERT (remaining)</td>
<td align="center">0.693</td>
<td align="center">0.700</td>
<td align="center">0.693</td>
<td align="center">0.658</td>
</tr>
<tr>
<td rowspan="3" align="left">Scenario II</td>
<td align="left">SITS-BERT</td>
<td align="center">0.644</td>
<td align="center">0.715</td>
<td align="center">0.644</td>
<td align="center">0.640</td>
</tr>
<tr>
<td align="left">RF</td>
<td align="center">
<bold>0.652</bold>
</td>
<td align="center">
<bold>0.738</bold>
</td>
<td align="center">
<bold>0.652</bold>
</td>
<td align="center">
<bold>0.673</bold>
</td>
</tr>
<tr>
<td align="left">SITS-BERT (remaining)</td>
<td align="center">0.670</td>
<td align="center">0.670</td>
<td align="center">0.670</td>
<td align="center">0.652</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>When the models were trained to predict more crop types (CTL2), both models showed slightly lower performance. Under Scenario I, the SITS-BERT model clearly outperformed the RF model, with a weighted F1 score of 0.739 (OA &#x3d; 0.759) compared to 0.704 (OA &#x3d; 0.702) for the RF model. Compared to the RF model, the SITS-BERT model yielded better evaluation metric values under Scenario II. However, as with the CTL1 prediction models, the performance of both models decreased slightly in Scenario II compared to Scenario I. The OA values for the remaining observations with the SITS-BERT model for CTL2 were 0.693 (F1 &#x3d; 0.658) and 0.670 (F1 &#x3d; 0.652), respectively, for Scenarios I and II.</p>
</sec>
<sec id="s3-5">
<label>3.5</label>
<title>Models trained with multi-year data (Case II)</title>
<p>During the Case II experiments, both SITS-BERT and the RF models were trained using multi-year (2014, 2015, and 2016) data. The models were then transferred to predict values (both CTL1 and CTL2) in two scenarios (Scenario I and II).</p>
<p>Compared to the models&#x2019; performances in Case I, both models showed improved results in Case II (<xref ref-type="table" rid="T5">Table 5</xref>). However, in CTL1 prediction under Scenario I, the SITS-BERT model indicated higher OA (0.855 vs. 0.844) and weighted F1 (0.848 vs. 0.841), whereas the RF models achieved better OA (0.835 vs. 0.807) and weighted F1 (0.838 vs. 0.812) in Scenario II. The OA values from the SITS-BERT model for the remaining observations were 0.756 (F1 &#x3d; 0.737) and 0.821 (F1 &#x3d; 0.820) for Scenarios I and II, respectively.</p>
<table-wrap id="T5" position="float">
<label>TABLE 5</label>
<caption>
<p>Model performance summary for Case II (fine-tuned with 3&#xa0;years data). Bold text highlights the best performance for each Scenario and crop type level.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">Class levels</th>
<th align="center">Scenario levels</th>
<th align="center">Model</th>
<th align="center">OA</th>
<th align="center">Weighted precision</th>
<th align="center">Weighted recall</th>
<th align="center">Weighted F1</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td rowspan="6" align="center">CTL1</td>
<td rowspan="3" align="center">Scenario I</td>
<td align="center">SITS-BERT</td>
<td align="center">
<bold>0.855</bold>
</td>
<td align="center">
<bold>0.846</bold>
</td>
<td align="center">
<bold>0.855</bold>
</td>
<td align="center">
<bold>0.848</bold>
</td>
</tr>
<tr>
<td align="center">RF</td>
<td align="center">0.844</td>
<td align="center">0.841</td>
<td align="center">0.844</td>
<td align="center">0.841</td>
</tr>
<tr>
<td align="center">SITS-BERT (remaining)</td>
<td align="center">0.756</td>
<td align="center">0.739</td>
<td align="center">0.756</td>
<td align="center">0.737</td>
</tr>
<tr>
<td rowspan="3" align="center">Scenario II</td>
<td align="center">SITS-BERT</td>
<td align="center">0.807</td>
<td align="center">0.844</td>
<td align="center">0.807</td>
<td align="center">0.812</td>
</tr>
<tr>
<td align="center">RF</td>
<td align="center">
<bold>0.835</bold>
</td>
<td align="center">
<bold>0.845</bold>
</td>
<td align="center">
<bold>0.835</bold>
</td>
<td align="center">
<bold>0.838</bold>
</td>
</tr>
<tr>
<td align="center">SITS-BERT (remaining)</td>
<td align="center">0.821</td>
<td align="center">0.828</td>
<td align="center">0.821</td>
<td align="center">0.820</td>
</tr>
<tr>
<td rowspan="6" align="center">CTL2</td>
<td rowspan="3" align="center">Scenario I</td>
<td align="center">SITS-BERT</td>
<td align="center">0.771</td>
<td align="center">
<bold>0.805</bold>
</td>
<td align="center">0.771</td>
<td align="center">0.762</td>
</tr>
<tr>
<td align="center">RF</td>
<td align="center">
<bold>0.789</bold>
</td>
<td align="center">0.789</td>
<td align="center">
<bold>0.789</bold>
</td>
<td align="center">
<bold>0.769</bold>
</td>
</tr>
<tr>
<td align="center">SITS-BERT (remaining)</td>
<td align="center">0.708</td>
<td align="center">0.731</td>
<td align="center">0.708</td>
<td align="center">0.689</td>
</tr>
<tr>
<td rowspan="3" align="center">Scenario II</td>
<td align="center">SITS-BERT</td>
<td align="center">0.725</td>
<td align="center">
<bold>0.816</bold>
</td>
<td align="center">0.725</td>
<td align="center">0.731</td>
</tr>
<tr>
<td align="center">RF</td>
<td align="center">
<bold>0.771</bold>
</td>
<td align="center">0.773</td>
<td align="center">
<bold>0.771</bold>
</td>
<td align="center">
<bold>0.766</bold>
</td>
</tr>
<tr>
<td align="center">SITS-BERT (remaining)</td>
<td align="center">0.749</td>
<td align="center">0.769</td>
<td align="center">0.749</td>
<td align="center">0.743</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>The model prediction for the CTL2 in Case II indicated that the RF models (OA &#x3d; 0.789 and 0.771 for the two Scenarios) were better than the SITS-BERT model (OA &#x3d; 0.771 and 0.725 for the two Scenarios). Based on the remaining observations, the SITS-BERT model obtained an OA of 0.708 and a weighted F1 of 0.689 in Scenario I. Under Scenario II, the remaining observation predictions with the SITS-BERT model achieved an OA of 0.749 and a weighted F1 score of 0.743. The confusion matrices for each model are summarised in the Supplementary Material (<xref ref-type="sec" rid="s12">Supplementary Appendix Figures A1&#x2013;A8</xref>).</p>
</sec>
<sec id="s3-6">
<label>3.6</label>
<title>SITS-BERT model accuracy per number of observations</title>
<p>The percentage of prediction accuracy for CTL1 and CTL2 under Scenarios I and II in Case I is provided in <xref ref-type="fig" rid="F5">Figure 5</xref>. In CTL1 Scenario I, the data with six observations had the lowest percentage (67%), while all other data with more than six observations obtained more than 80% accuracy. For Scenario II, the data with three, four, and five observations obtained 60%, 45%, and 70% accuracy, respectively. However, the data with more than 7 observations achieved more than 70% accuracy. Similar to the overall model performance, CTL2 in Scenarios I and II showed lower accuracy values for varying observations. For Scenario II, the data with six observations again yielded the lowest accuracy (67%) for CTL2, while all other data, ranging from seven to sixteen observations, achieved accuracies greater than 75%, except for the data with ten observations (74%). Considering Scenario II, the data with 15 observations provided the lowest accuracy (49%). Further, the data with four, five, sixteen, seventeen, eighteen, nineteen, and twenty observations obtained accuracies below 60%. At both crop type levels (CTL1 and CTL2) and across Scenarios, the highest accuracy was achieved with the data set with the largest number of observations.</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>Impact of the number of Landsat observations in the variable-length time-series on the accuracy in both Scenarios and fine-tuning Cases.</p>
</caption>
<graphic xlink:href="frsen-07-1782148-g005.tif">
<alt-text content-type="machine-generated">Bar chart with four panels comparing the percentage of accurately predicted data versus number of Landsat observations for CTL1 and CTL2, under Scenario I and Scenario II, with values generally higher in Scenario I.</alt-text>
</graphic>
</fig>
</sec>
</sec>
<sec sec-type="discussion" id="s4">
<label>4</label>
<title>Discussion</title>
<p>In this study, the application of recently developed transformer-based deep learning models with SSL for crop type mapping using L-SITS data was explored. The results of this study showed that the L-SITS data, combined with the SITS-BERT model, could accurately predict both simple (CLT1) and advanced (CLT2) crop types. Furthermore, the findings demonstrated that fine-tuning of the pre-trained SITS-BERT model with 3&#xa0;years data provided better results compared to using single-year data.</p>
<sec id="s4-1">
<label>4.1</label>
<title>L-SITS data</title>
<p>This study explored the application of solely L-SITS data from 2010 to 2018 for crop type classification. During that period, Landsat 5 data were available until 2011, and Landsat 7 data were available from 1999 (till 2024) (<xref ref-type="bibr" rid="B18">U.S. Geological Survey, 2025</xref>). The Landsat 8 data have been available since 2013 (<xref ref-type="bibr" rid="B18">U.S. Geological Survey, 2025</xref>). As a result, in 2012, Landsat 7 data were the only available source, leading to limited cloud-free data availability and preventing the use of 2012 data in the study area. In all other years of the assessment, at least two Landsat satellite datasets were available to generate L-SITS data for each year. This ensured having the maximum temporal observations for the L-SITS data. Compared to the current variable-length SITS applications using Sentinel 1, 2, or a combination of Landsat and Sentinel 2 (<xref ref-type="bibr" rid="B2">Chaves et al., 2020</xref>). The L-SITS data explored in this study had a lower temporal resolution. Although L-SITS data have lower temporal resolution, variable-length L-SITS data showed potential for crop type mapping in Germany, which would be beneficial for areas or periods without Sentinel data. When it comes to crop type mapping before 2010, with the suggested model, SITS data from at least two Landsat satellites (either Landsat 4 and 5 or Landsat 5 and 7) can be used. Therefore, it enables crop type mapping going back to the 1980s.</p>
<p>Moreover, this study demonstrated that over 245 days (from March to October), a minimum of five and a maximum of 25 temporal observations could be obtained for a variable-length L-SITS in different regions within the study area. For example, a single L-SITS had five observations at 81, 105, 217, 232, and 272 DoY (March 22, April 15, August 5, August 20, and September 29). However, based on this example, we can see that even with fewer observations, the L-SITS data have well-distributed time-series within the main crop-growth season. This outcome is helpful for tasks that require differentiation of crop types based on their phenological patterns. Moreover, with very few observations, the prediction accuracy did not show a substantial reduction (<xref ref-type="fig" rid="F5">Figure 5</xref>), further supporting the application of the SITS-BERT model for crop type mapping using L-SITS data. In contrast, the results for Scenario II indicated that L-SITS with 15 observations produced (<xref ref-type="fig" rid="F5">Figure 5</xref>) the lowest correctly classified percentage (for CTL2). Further examination of the L-SITS dataset with 15 observations revealed that one incorrectly predicted example included five observations from July, with no observations at the beginning or end of the time-series and no observations from June. Such behaviour highlights a potential limitation of the model, indicating the need for further fine-tuning and the incorporation of novel adaptations, such as temporal encoding (<xref ref-type="bibr" rid="B15">Pham et al., 2024</xref>), to better capture temporal dependencies within the time-series.</p>
</sec>
<sec id="s4-2">
<label>4.2</label>
<title>Application of SITS-BERT with L-SITS data</title>
<p>This study is one of the first attempts to explore the SSL method with variable-length L-SITS data for crop type mapping. Considering this, the SITS-BERT model was pre-trained using 5&#xa0;years of variable-length L-SITS data without labels. As mentioned before, the SITS-BERT model was introduced with the application of the Sentinel-2 SITS data by (<xref ref-type="bibr" rid="B25">Yuan and Lin, 2021</xref>). This study attempted to reimplement a similar model using L-SITS data. Compared to the original version with Sentinel data, this study also incorporated a similar pretext task during model pre-training to leverage the advantage of extensive unlabelled data.</p>
<p>The pre-trained SITS-BERT model was then fine-tuned using two different training datasets: a single year (Case I) and a multi&#x2013;year (Case II) dataset. The single-year training dataset consistently showed a minimum accuracy of 0.644 for CTL-2 in future years (Scenario II). Compared to that, the multi-year training dataset achieved a minimum accuracy of 0.725 for the same scenario, representing an approximately 16% increase. Compared with the original work using Sentinel 2 data, these accuracy values were substantially lower (<xref ref-type="bibr" rid="B25">Yuan and Lin, 2021</xref>). However, when it comes to CTL2 predicting for the past years (Scenario I), both single-year and multi-year training cases showed similar performance (0.759 and 0.771 of OA). These results were better than those obtained by (<xref ref-type="bibr" rid="B15">Pham et al., 2024</xref>) using Landsat 5 and 7 data with temporal encoding to the irregular time-series. This indicated that the application of L-SITS data with the SITS-BERT model could be a potential tool for predicting crop types before the Sentinel era, overcoming challenges encountered by (<xref ref-type="bibr" rid="B15">Pham et al., 2024</xref>).</p>
<p>The baseline model used in this study was the RF model trained on fixed-length L-SITS data. The fine-tuned SITS-BERT model with variable-length L-SITS data outperformed the RF model with fixed-length L-SITS when trained on single-year data. This was a significant advantage when there was not enough labelled data to train the model. On the other hand, due to the fixed-length L-SITS, the number of data points used for training and testing the RF model was mainly lower than that of the SITS-BERT model. The increased number of data points improved the performance of the SITS-BERT model. Under Case I, the RF model was trained with 17% fewer observations than the SITS-BERT model. However, in Case II, only 5% fewer observations were used in the RF model, and the differences in model performance were not substantial.</p>
</sec>
<sec id="s4-3">
<label>4.3</label>
<title>Simple vs. advanced crop type classification</title>
<p>This study examined two different crop types (CTL1 and CTL2) at two distinct levels and evaluated model performance across both levels. The CTL1 contained simple crop type groups, which comprised broader crop categories. The SITS-BERT model with both cases (Case I and Case II) consistently showed higher OA values than the baseline RF model (<xref ref-type="table" rid="T4">Tables 4</xref>, <xref ref-type="table" rid="T5">5</xref>). The winter crops (C3) showed the highest class-level F1 (Case I &#x3d; 0.909 and Case II &#x3d; 0.941). These results were better than this study&#x2019;s baseline RF model results (F1 was 0.877 and 0.926) and findings from (<xref ref-type="bibr" rid="B22">Wijesingha et al. (2024)</xref> for winter crops using fixed-length L-SITS data with the RF and the CNN models transferred to another temporal domain (F1 was between 0.83 and 0.90). This also confirmed that broader crop type classification could benefit from variable-length L-SITS and SITS-BERT models.</p>
<p>The complex crop type labels were included in CTL2; thus, both SITS-BERT and baseline RF models underperformed compared to CTL1. Similar to all the results, however, the SITS-BERT model predictions for Scenario I (for years 2010 and 2011) showed higher OA compared to Scenario II (for years 2017 and 2018) (<xref ref-type="table" rid="T4">Table 4</xref>). However, results reported by (<xref ref-type="bibr" rid="B15">Pham et al., 2024</xref>) indicated higher model performances for later years (OA was 86.4 and 90.9 for 2017 and 2018) than for past years (OA was 61.9 and 62.8 for 2010 and 2011) for 14 crop types using temporally encoded SITS data. This again confirms that the application of the SITS-BERT model with variable-length L-SITS data is effective for past crop type mapping tasks, including those with complex crop classes.</p>
<p>The STIS-BERT model&#x2019;s capability to separate maize (C21) from other summer cereals (C22) was substantially higher, where the maize F1 scores for Scenario I were 0.893 and 0.933 for Cases I and II, respectively. These F1 scores for maize were higher than the results reported by (<xref ref-type="bibr" rid="B15">Pham et al., 2024</xref>; <xref ref-type="bibr" rid="B15">Pham et al., 2024</xref>), where temporally encoded SITS data were used to predict crop type in the years 2010 (F1 &#x3d; 0.8) and 2011 (F1 &#x3d; 0.9) (similar to Scenario I). However, when separating winter wheat (C31) from other winter cereals (C32), models performed poorly in both scenarios. A possible reason for this performance could be the class distribution of the data. In the study regions, the number of fields with maize was significantly higher than that of summer cereals, enabling the model to identify distinct patterns in maize&#x2019;s SITS data compared to those of summer cereals. On the other hand, the proportion of winter wheat compared to winter cereals was lower (especially in the Ammerland district). A similar pattern of results was reported by (<xref ref-type="bibr" rid="B15">Pham et al., 2024</xref>), though the models in this study were trained with similar class observations, yet the winter cereals (wheat, barley, and rye) reported 0.6 as an average F1 score.</p>
<p>The SITS-BERT model predictions for the complex crop categories, such as oil seeds (C41), permanent crops (C42), and root crops and vegetables (C43), clearly indicated that when the model was trained with multiple years, the predictability of these classes increased compared to a model trained with a single year of data. Among these crop classes, C42 showed the best performance (F1 score&#x2265;0.5) in both Scenarios (using the Case I and II models), though most of the C42 data was available in the district of Ammerland. The C41 class had an F1 score of more than 0.55 for the models in Case II. However, these class performances were lower than the F1-scores for separate classes of rapeseed and sunflower (&#x3e;0.6) from the models with temporally encoded SITS data (<xref ref-type="bibr" rid="B15">Pham et al., 2024</xref>). The class C43 was a complex class that combined root crops and vegetables. The decision to merge root crops and vegetables into the C43 class was made to increase the number of data points per class to reduce the impact of the class imbalance. However, this grouping led to a decrease in prediction accuracy due to the complexity of phenological and morphological characteristics of both crop types. This outcome suggests that a standard approach is necessary when defining crop classes for SITS data, as simply increasing sample size does not overcome fundamental differences between crop types and the class imbalance problem.</p>
</sec>
</sec>
<sec sec-type="conclusion" id="s5">
<label>5</label>
<title>Conclusion</title>
<p>This study evaluated the application of recently developed transformer-based deep learning models with SSL for crop type mapping using variable-length L-SITS for the pre-Sentinel era. The results clearly demonstrated that variable-length L-SITS extracted from available cloud-free data points can still be useful for crop-type or other mapping tasks when used with the SITS-BERT model. Similarly, the pre-trained SITS-BERT model could be finetuned with single-year data (fewer data points) and achieved reasonable accuracies for both simple (CTL1) and advanced (CTL2) crop type mapping. These results were better than those of the baseline RF model, which was trained on fixed-length L-SITS data. This is a significant advantage in cases where there is insufficient labelled data to train the model. Further, fine-tuning with multi-year data also improved model performance. The study also investigated the impact of the number of L-SITS observations on the accuracy of the SITS-BERT model for variable-length L-SITS data. The results showed that even with a small number of observations, prediction accuracy did not decline substantially. The model evaluation also assessed the SITS-BERT model&#x2019;s predictions for past and future years relative to its training years to evaluate its generalisability across different temporal domains, and this study&#x2019;s results showed somewhat better performance for past years than for future years. Overall, the use of variable-length L-SITS data with the SITS-BERT model enables the application of L-SITS data for crop-type mapping dating back to the 1980s.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="s6">
<title>Data availability statement</title>
<p>The data analyzed in this study is subject to the following licenses/restrictions: The Landsat data is available to download through respective sources (e.g., USGS Earth Explorer or Google Earth Engine), but the crop type data (polygons of fields) are restricted to share. Requests to access these datasets should be directed to jayan.wijesingha@uni-kassel.de.</p>
</sec>
<sec sec-type="author-contributions" id="s7">
<title>Author contributions</title>
<p>JW: Data curation, Visualization, Software, Formal Analysis, Methodology, Investigation, Validation, Writing &#x2013; original draft, Conceptualization. IB: Writing &#x2013; review and editing, Project administration, Data curation, Conceptualization.</p>
</sec>
<ack>
<title>Acknowledgements</title>
<p>The authors sincerely thank Prof. Dr. Michael Wachendorf for providing the facilities and support necessary to carry out this research. We would like to thank the Ministry of Agriculture of Lower Saxony, Germany, for providing historical agricultural land use (IACS) data for the training and validation of the models.</p>
</ack>
<sec sec-type="COI-statement" id="s9">
<title>Conflict of interest</title>
<p>The author(s) declared that this work was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="ai-statement" id="s10">
<title>Generative AI statement</title>
<p>The author(s) declared that generative AI was not used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p>
</sec>
<sec sec-type="disclaimer" id="s11">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec sec-type="supplementary-material" id="s12">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/frsen.2026.1782148/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/frsen.2026.1782148/full&#x23;supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="Table1.docx" id="SM1" mimetype="application/docx" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Asam</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Gessner</surname>
<given-names>U.</given-names>
</name>
<name>
<surname>Gonz&#xe1;lez</surname>
<given-names>R. A.</given-names>
</name>
<name>
<surname>Wenzl</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Kriese</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Kuenzer</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Mapping crop types of Germany by combining temporal statistical metrics of Sentinel-1 and Sentinel-2 time series with LPIS data</article-title>. <source>Remote Sens. (Basel).</source> <volume>14</volume>. <pub-id pub-id-type="doi">10.3390/rs14132981</pub-id>
</mixed-citation>
</ref>
<ref id="B2">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chaves</surname>
<given-names>M. E. D.</given-names>
</name>
<name>
<surname>Picoli</surname>
<given-names>M. C. A.</given-names>
</name>
<name>
<surname>Sanches</surname>
<given-names>I. D.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Recent applications of landsat 8/OLI and Sentinel-2/MSI for land use and land cover mapping: a systematic review</article-title>. <source>Remote Sens. (Basel).</source> <volume>12</volume>. <pub-id pub-id-type="doi">10.3390/rs12183062</pub-id>
</mixed-citation>
</ref>
<ref id="B3">
<mixed-citation publication-type="book">
<collab>CLC Service</collab> (<year>2023</year>). <source>CLCplus backbone 2018 (raster 10 m)</source>, <volume>Europe</volume>. <pub-id pub-id-type="doi">10.2909/cd534ebf-f553-42f0-9ac1-62c1dc36d32c</pub-id>
</mixed-citation>
</ref>
<ref id="B4">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gorelick</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Hancher</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Dixon</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Ilyushchenko</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Thau</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Moore</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Google Earth Engine: planetary-scale geospatial analysis for everyone</article-title>. <source>Remote Sens. Environ.</source> <volume>202</volume>, <fpage>18</fpage>&#x2013;<lpage>27</lpage>. <pub-id pub-id-type="doi">10.1016/j.rse.2017.06.031</pub-id>
</mixed-citation>
</ref>
<ref id="B5">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Karthikeyan</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Chawla</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Mishra</surname>
<given-names>A. K.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>A review of remote sensing applications in agriculture for food security: crop growth and yield, irrigation, and crop losses</article-title>. <source>J. Hydrol. (Amst).</source> <volume>586</volume>, <fpage>124905</fpage>. <pub-id pub-id-type="doi">10.1016/j.jhydrol.2020.124905</pub-id>
</mixed-citation>
</ref>
<ref id="B6">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Knorn</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Rabe</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Radeloff</surname>
<given-names>V. C.</given-names>
</name>
<name>
<surname>Kuemmerle</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Kozak</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Hostert</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Land cover mapping of large areas using chain classification of neighboring landsat satellite images</article-title>. <source>Remote Sens. Environ.</source> <volume>113</volume>, <fpage>957</fpage>&#x2013;<lpage>964</lpage>. <pub-id pub-id-type="doi">10.1016/j.rse.2009.01.010</pub-id>
</mixed-citation>
</ref>
<ref id="B7">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kyere</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Astor</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Gra&#xdf;</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Wachendorf</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Multi-temporal agricultural land-cover mapping using single-year and multi-year models based on landsat imagery and IACS data</article-title>. <source>Agronomy</source> <volume>9</volume>, <fpage>13</fpage>&#x2013;<lpage>15</lpage>. <pub-id pub-id-type="doi">10.3390/agronomy9060309</pub-id>
</mixed-citation>
</ref>
<ref id="B8">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lee</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Shin</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2025</year>). <article-title>Beyond information distortion: imaging variable-length time series data for classification</article-title>. <source>Sensors</source> <volume>25</volume>, <fpage>621</fpage>. <pub-id pub-id-type="doi">10.3390/s25030621</pub-id>
<pub-id pub-id-type="pmid">39943260</pub-id>
</mixed-citation>
</ref>
<ref id="B9">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Miller</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Pelletier</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Webb</surname>
<given-names>G. I.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Deep learning for satellite image time-series analysis: a review</article-title>. <source>IEEE Geosci. Remote Sens. Mag.</source> <volume>12</volume>, <fpage>81</fpage>&#x2013;<lpage>124</lpage>. <pub-id pub-id-type="doi">10.1109/MGRS.2024.3393010</pub-id>
</mixed-citation>
</ref>
<ref id="B10">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Montero</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Eemont: a python package that extends google Earth engine</article-title>. <source>J. Open Source Softw.</source> <volume>6</volume>, <fpage>3168</fpage>. <pub-id pub-id-type="doi">10.21105/joss.03168</pub-id>
</mixed-citation>
</ref>
<ref id="B11">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nyborg</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Pelletier</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Lef&#xe8;vre</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Assent</surname>
<given-names>I.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>TimeMatch: unsupervised cross-region adaptation by temporal shift estimation</article-title>. <source>ISPRS J. Photogrammetry Remote Sens.</source> <volume>188</volume>, <fpage>301</fpage>&#x2013;<lpage>313</lpage>. <pub-id pub-id-type="doi">10.1016/j.isprsjprs.2022.04.018</pub-id>
</mixed-citation>
</ref>
<ref id="B12">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ofori-Ampofo</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Pelletier</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Lang</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Crop type mapping from optical and radar time series using attention-based deep learning</article-title>. <source>Remote Sens. (Basel).</source> <volume>13</volume>, <fpage>1</fpage>&#x2013;<lpage>17</lpage>. <pub-id pub-id-type="doi">10.3390/rs13224668</pub-id>
</mixed-citation>
</ref>
<ref id="B13">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Orynbaikyzy</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Gessner</surname>
<given-names>U.</given-names>
</name>
<name>
<surname>Conrad</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Spatial transferability of random forest models for crop type classification using Sentinel-1 and Sentinel-2</article-title>. <source>Remote Sens. (Basel).</source> <volume>14</volume>, <fpage>1493</fpage>. <pub-id pub-id-type="doi">10.3390/rs14061493</pub-id>
</mixed-citation>
</ref>
<ref id="B14">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Persello</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Wegner</surname>
<given-names>J. D.</given-names>
</name>
<name>
<surname>Hansch</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Tuia</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Ghamisi</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Koeva</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Deep learning and Earth observation to support the sustainable development goals: current approaches, open challenges, and future opportunities</article-title>. <source>IEEE Geosci. Remote Sens. Mag.</source> <volume>10</volume>, <fpage>172</fpage>&#x2013;<lpage>200</lpage>. <pub-id pub-id-type="doi">10.1109/MGRS.2021.3136100</pub-id>
</mixed-citation>
</ref>
<ref id="B15">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pham</surname>
<given-names>V.-D.</given-names>
</name>
<name>
<surname>Tetteh</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Thiel</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Erasmi</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Schwieder</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Frantz</surname>
<given-names>D.</given-names>
</name>
<etal/>
</person-group> (<year>2024</year>). <article-title>Temporally transferable crop mapping with temporal encoding and deep learning augmentations</article-title>. <source>Int. J. Appl. Earth Observation Geoinformation</source> <volume>129</volume>, <fpage>103867</fpage>. <pub-id pub-id-type="doi">10.1016/j.jag.2024.103867</pub-id>
</mixed-citation>
</ref>
<ref id="B16">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ru&#xdf;wurm</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>K&#xf6;rner</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Self-attention for raw optical satellite time series classification</article-title>. <source>ISPRS J. Photogrammetry Remote Sens.</source> <volume>169</volume>, <fpage>421</fpage>&#x2013;<lpage>435</lpage>. <pub-id pub-id-type="doi">10.1016/j.isprsjprs.2020.06.006</pub-id>
</mixed-citation>
</ref>
<ref id="B17">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tran</surname>
<given-names>K. H.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>H. K.</given-names>
</name>
<name>
<surname>Shen</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Ye</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2025</year>). <article-title>A transformer-based model for detecting land surface phenology from the irregular harmonized landsat and Sentinel-2 time series across the United States</article-title>. <source>Remote Sens. Environ.</source> <volume>320</volume>, <fpage>114656</fpage>. <pub-id pub-id-type="doi">10.1016/j.rse.2025.114656</pub-id>
</mixed-citation>
</ref>
<ref id="B18">
<mixed-citation publication-type="web">
<collab>U.S. Geological Survey</collab> (<year>2025</year>). <article-title>Landsat missions</article-title>. <comment>Available online at: <ext-link ext-link-type="uri" xlink:href="https://www.usgs.gov/landsat-missions">https://www.usgs.gov/landsat-missions</ext-link> (Accessed October 24, 2025)</comment>.</mixed-citation>
</ref>
<ref id="B19">
<mixed-citation publication-type="web">
<person-group person-group-type="author">
<name>
<surname>Vaswani</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Shazeer</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Parmar</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Uszkoreit</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Jones</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Gomez</surname>
<given-names>A. N.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>Attention is all you need</article-title>. <comment>Available online at: <ext-link ext-link-type="uri" xlink:href="http://arxiv.org/abs/1706.03762">http://arxiv.org/abs/1706.03762</ext-link> (Accessed May 22, 2025).</comment>
</mixed-citation>
</ref>
<ref id="B20">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Voelsen</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Rottensteiner</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Heipke</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Transformer models for land cover classification with satellite image time series</article-title>. <source>PFG - J. Photogrammetry, Remote Sens. Geoinformation Sci.</source> <volume>92</volume>, <fpage>547</fpage>&#x2013;<lpage>568</lpage>. <pub-id pub-id-type="doi">10.1007/s41064-024-00299-7</pub-id>
</mixed-citation>
</ref>
<ref id="B21">
<mixed-citation publication-type="web">
<person-group person-group-type="author">
<name>
<surname>Wen</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Ma</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Yan</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Transformers in time series: a survey</article-title>. <comment>Available online at: <ext-link ext-link-type="uri" xlink:href="http://arxiv.org/abs/2202.07125">http://arxiv.org/abs/2202.07125</ext-link> (Accessed May 22, 2025).</comment>
</mixed-citation>
</ref>
<ref id="B22">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wijesingha</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Dzene</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Wachendorf</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Evaluating the spatial&#x2013;temporal transferability of models for agricultural land cover mapping using landsat archive</article-title>. <source>ISPRS J. Photogrammetry Remote Sens.</source> <volume>213</volume>, <fpage>72</fpage>&#x2013;<lpage>86</lpage>. <pub-id pub-id-type="doi">10.1016/j.isprsjprs.2024.05.020</pub-id>
</mixed-citation>
</ref>
<ref id="B23">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wu</surname>
<given-names>Q.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Geemap: a python package for interactive mapping with google Earth engine</article-title>. <source>J. Open Source Softw.</source> <volume>5</volume>, <fpage>2305</fpage>. <pub-id pub-id-type="doi">10.21105/joss.02305</pub-id>
</mixed-citation>
</ref>
<ref id="B24">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Ma</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Z.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Self-supervised pre-training for large-scale crop mapping using Sentinel-2 time series</article-title>. <source>ISPRS J. Photogrammetry Remote Sens.</source> <volume>207</volume>, <fpage>312</fpage>&#x2013;<lpage>325</lpage>. <pub-id pub-id-type="doi">10.1016/j.isprsjprs.2023.12.005</pub-id>
</mixed-citation>
</ref>
<ref id="B25">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yuan</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Lin</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Self-supervised pretraining of transformers for satellite image time series classification</article-title>. <source>IEEE J. Sel. Top. Appl. Earth Obs. Remote Sens.</source> <volume>14</volume>, <fpage>474</fpage>&#x2013;<lpage>487</lpage>. <pub-id pub-id-type="doi">10.1109/JSTARS.2020.3036602</pub-id>
</mixed-citation>
</ref>
<ref id="B26">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zeng</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Wardlow</surname>
<given-names>B. D.</given-names>
</name>
<name>
<surname>Xiang</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Hu</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>A review of vegetation phenological metrics extraction using time-series, multispectral satellite data</article-title>. <source>Remote Sens. Environ.</source> <volume>237</volume>, <fpage>111511</fpage>. <pub-id pub-id-type="doi">10.1016/j.rse.2019.111511</pub-id>
</mixed-citation>
</ref>
<ref id="B27">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>H. K.</given-names>
</name>
<name>
<surname>Shen</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2025</year>). <article-title>Robust and timely within-season conterminous United States crop type mapping using landsat Sentinel-2 time series and the transformer architecture</article-title>. <source>Remote Sens. Environ.</source> <volume>329</volume>, <fpage>114950</fpage>. <pub-id pub-id-type="doi">10.1016/j.rse.2025.114950</pub-id>
</mixed-citation>
</ref>
</ref-list>
<fn-group>
<fn fn-type="custom" custom-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1165816/overview">Peter Potapov</ext-link>, World Resources Institute, United States</p>
</fn>
<fn fn-type="custom" custom-type="reviewed-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/811072/overview">Ahmad Khan</ext-link>, University of Maryland, College Park, United States</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3347540/overview">Haijun Li</ext-link>, University of Maryland, College Park, United States</p>
</fn>
</fn-group>
</back>
</article>