<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Sports Act. Living</journal-id>
<journal-title>Frontiers in Sports and Active Living</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Sports Act. Living</abbrev-journal-title>
<issn pub-type="epub">2624-9367</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fspor.2025.1661456</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Sports and Active Living</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Technical classification of professional cycling stages using unsupervised learning: implications for performance variability</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author"><name><surname>Garcia-Atutxa</surname><given-names>Igor</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="author-notes" rid="fn001"><sup>&#x2020;</sup></xref><uri xlink:href="https://loop.frontiersin.org/people/2778734/overview"/><role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/><role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/></contrib>
<contrib contrib-type="author"><name><surname>Dudagoitia Barrio</surname><given-names>Ekaitz</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="author-notes" rid="fn001"><sup>&#x2020;</sup></xref><role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/></contrib>
<contrib contrib-type="author" corresp="yes"><name><surname>Villanueva-Flores</surname><given-names>Francisca</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="corresp" rid="cor1">&#x002A;</xref>
<xref ref-type="author-notes" rid="fn001"><sup>&#x2020;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/2778636/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/></contrib>
</contrib-group>
<aff id="aff1"><label><sup>1</sup></label><institution>Escuela Polit&#x00E9;cnica Superior, Universidad Cat&#x00F3;lica de Murcia (UCAM)</institution>, <addr-line>Murcia</addr-line>, <country>Spain</country></aff>
<aff id="aff2"><label><sup>2</sup></label><institution>University of Murcia</institution>, <addr-line>Murcia</addr-line>, <country>Spain</country></aff>
<aff id="aff3"><label><sup>3</sup></label><institution>Centro de Investigaci&#x00F3;n en Ciencia Aplicada y Tecnolog&#x00ED;a Avanzada, Instituto Polit&#x00E9;cnico Nacional</institution>, <addr-line>Atlacholoaya, Morelos</addr-line>, <country>Mexico</country></aff>
<author-notes>
<fn fn-type="edited-by"><p><bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1592369/overview">Ant&#x00F3;nio Miguel Monteiro</ext-link>, Instituto Polit&#x00E9;cnico de Bragan&#x00E7;a, Portugal</p></fn>
<fn fn-type="edited-by"><p><bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/761146/overview">Pedro Forte</ext-link>, Higher Institute of Educational Sciences of the Douro, Portugal</p>
<p><ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1564232/overview">Jos&#x00E9; Eduardo Teixeira</ext-link>, Instituto Polit&#x00E9;cnico da Guarda, Portugal</p></fn>
<corresp id="cor1"><label>&#x002A;</label><bold>Correspondence:</bold> Francisca Villanueva-Flores <email>fvillanuevaf@ipn.mx</email></corresp>
<fn fn-type="other" id="fn001"><label><sup>&#x2020;</sup></label><p>ORCID Igor Garcia-Atutxa <ext-link ext-link-type="uri" xlink:href="http://orcid.org/0009-0002-1551-2685">orcid.org/0009-0002-1551-2685</ext-link> Ekaitz Dudagoitia Barrio <ext-link ext-link-type="uri" xlink:href="http://orcid.org/0000-0003-0990-3081">orcid.org/0000-0003-0990-3081</ext-link> Francisca Villanueva-Flores <ext-link ext-link-type="uri" xlink:href="http://orcid.org/0000-0001-6092-4211">orcid.org/0000-0001-6092-4211</ext-link></p></fn>
</author-notes>
<pub-date pub-type="epub"><day>15</day><month>10</month><year>2025</year></pub-date>
<pub-date pub-type="collection"><year>2025</year></pub-date>
<volume>7</volume><elocation-id>1661456</elocation-id>
<history>
<date date-type="received"><day>07</day><month>07</month><year>2025</year></date>
<date date-type="accepted"><day>22</day><month>09</month><year>2025</year></date>
</history>
<permissions>
<copyright-statement>&#x00A9; 2025 Garcia-Atutxa, Dudagoitia Barrio and Villanueva-Flores.</copyright-statement>
<copyright-year>2025</copyright-year><copyright-holder>Garcia-Atutxa, Dudagoitia Barrio and Villanueva-Flores</copyright-holder><license license-type="open-access" xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="http://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<abstract><sec><title>Introduction</title>
<p>In professional cycling, the technical characteristics of race stages significantly influence group dynamics and performance variability among competitors. However, stage classifications have traditionally been subjective, lacking a robust empirical foundation. This study aimed to develop an objective, technical classification of professional cycling stages using unsupervised learning (KMeans) and analyze how these categories relate to collective performance variability, measured by the coefficient of variation (CV) of finish times.</p>
</sec><sec><title>Methods</title>
<p>Technical data and official results from 439 international race stages conducted between 2017 and 2023 were analyzed. The technical variables included distance, total vertical gain, average relative elevation, and percentages of paved and unpaved surfaces.</p>
</sec><sec><title>Results</title>
<p>Cluster validation via Bootstrap analysis demonstrated high stability (mean silhouette index&#x2009;&#x003D;&#x2009;0.62&#x2009;&#x00B1;&#x2009;0.03), confirming six clearly distinct technical stage groups. Results indicated that stages characterized by higher relative elevation and greater proportions of unpaved surfaces exhibited higher performance variability (higher CV), whereas less technically demanding stages showed lower variability; relative elevation emerged as the strongest predictor of CV (<italic>&#x03B2;</italic>&#x2009;&#x003D;&#x2009;0.42, <italic>p</italic>&#x2009;&#x003C;&#x2009;0.001), followed by unpaved percentage (<italic>&#x03B2;</italic>&#x2009;&#x003D;&#x2009;0.23, <italic>p</italic>&#x2009;&#x003C;&#x2009;0.01), distance (<italic>&#x03B2;</italic>&#x2009;&#x003D;&#x2009;0.18, <italic>p</italic>&#x2009;&#x003C;&#x2009;0.05), and vertical gain (<italic>&#x03B2;</italic>&#x2009;&#x003D;&#x2009;0.11, <italic>p</italic>&#x2009;&#x003C;&#x2009;0.05). Across 2017&#x2013;2023, a broadly downward pattern in CV was observed, although a pooled linear-trend test with cluster fixed effects did not reach statistical significance (<italic>p</italic>&#x2009;&#x003D;&#x2009;0.315).</p>
</sec><sec><title>Discussion</title>
<p>The lack of physiological data and possible confounding from unmeasured stage and team factors (e.g., weather, stage order, team tactics) limit causal inference. This empirical typology provides a valuable quantitative tool to optimize competitive strategies, plan targeted training based on stage type, and prevent cumulative fatigue and performance-related injuries in high-performance cycling. Future research incorporating direct physiological data is recommended to further explore the relationship between external and internal load in professional cycling.</p>
</sec>
</abstract>
<kwd-group>
<kwd>professional cycling</kwd>
<kwd>unsupervised learning</kwd>
<kwd>clustering</kwd>
<kwd>performance variability</kwd>
<kwd>external load</kwd>
</kwd-group><contract-num rid="cn001">SIP20242814</contract-num><contract-sponsor id="cn001">Instituto Polit&#x00E9;cnico Nacional</contract-sponsor><contract-sponsor id="cn002">Direcci&#x00F3;n de Investigaci&#x00F3;n: Convocatoria de Apoyos econ&#x00F3;micos para Publicaciones y Tr&#x00E1;mite de Invenciones</contract-sponsor><counts>
<fig-count count="5"/>
<table-count count="2"/><equation-count count="0"/><ref-count count="31"/><page-count count="9"/><word-count count="0"/></counts><custom-meta-wrap><custom-meta><meta-name>section-at-acceptance</meta-name><meta-value>Elite Sports and Performance Enhancement</meta-value></custom-meta></custom-meta-wrap>
</article-meta>
</front>
<body><sec id="s1" sec-type="intro"><label>1</label><title>Introduction</title>
<p>Professional road cycling is an endurance sport marked by considerable technical and physiological complexity. Cycling stages exhibit substantial variation in factors such as total distance, accumulated elevation gain, average gradient, and terrain composition (<xref ref-type="bibr" rid="B1">1</xref>&#x2013;<xref ref-type="bibr" rid="B3">3</xref>). These technical characteristics significantly shape the tactical strategies employed by teams and directly influence the physiological distribution and collective performance dynamics within the peloton (<xref ref-type="bibr" rid="B4">4</xref>).</p>
<p>Traditionally, cycling stages have been classified into broad categories such as &#x201C;flat&#x201D;, &#x201C;mountainous&#x201D;, or &#x201C;time trial&#x201D;. However, this conventional classification tends to be subjective and often lacks empirical precision, potentially overlooking relevant technical combinations observed in actual racing conditions (<xref ref-type="bibr" rid="B5">5</xref>, <xref ref-type="bibr" rid="B6">6</xref>). Recent studies have highlighted that objective technical variables, such as accumulated elevation, relative elevation per kilometer, and surface composition, critically impact muscular fatigue, sustainable power output, and recovery between consecutive efforts in professional cycling (<xref ref-type="bibr" rid="B7">7</xref>, <xref ref-type="bibr" rid="B8">8</xref>). These variables define the &#x201C;external load&#x201D;, a central concept in performance physiology that determines the intensity and specificity of physical demands during prolonged competitions (<xref ref-type="bibr" rid="B9">9</xref>&#x2013;<xref ref-type="bibr" rid="B11">11</xref>).</p>
<p>Recently, researchers have paid attention to how these technical characteristics affect not only individual performance but also the cohesion and collective durability of group performance during stage races (<xref ref-type="bibr" rid="B12">12</xref>). This variability may increase the risk of fatigue-related injuries and highlight the need for better strategic adaptation (<xref ref-type="bibr" rid="B13">13</xref>, <xref ref-type="bibr" rid="B14">14</xref>).</p>
<p>In parallel, recent advances in data science and machine learning algorithms have revolutionized methodologies for classifying and analyzing sports data. Clustering methods, in particular, enable empirical classification of sports events based on objective data patterns, offering more precise and reproducible typologies than traditional classifications (<xref ref-type="bibr" rid="B15">15</xref>, <xref ref-type="bibr" rid="B16">16</xref>). Beyond cycling, unsupervised learning has been increasingly applied across endurance sports. For example, in running to identify technique-based subgroups and their relation to running economy (<xref ref-type="bibr" rid="B17">17</xref>), in collegiate cross-country cohorts using hierarchical clustering to profile mechanics and risk factors (<xref ref-type="bibr" rid="B18">18</xref>), and in swimming to partition inertial measurement unit (IMU)-derived functional data into skill-related patterns (<xref ref-type="bibr" rid="B19">19</xref>), thereby broadening the methodological context relevant to our approach. In cycling, the application of these methodologies remains limited, though initial studies have demonstrated their potential to generate empirically grounded typologies of cycling stages, thus facilitating improved strategic planning and more effective training load management (<xref ref-type="bibr" rid="B20">20</xref>).</p>
<p>Nevertheless, despite the practical relevance of the relationship between objective technical stage classifications and variability in collective performance, this connection has received limited empirical exploration in recent sports literature. The coefficient of variation (CV) of finish times emerges as a key indicator for assessing how specific technical features affect peloton performance homogeneity or dispersion (<xref ref-type="bibr" rid="B21">21</xref>, <xref ref-type="bibr" rid="B22">22</xref>).</p>
<p>Therefore, the primary objective of this study is to develop an empirical and objective classification of professional cycling stages using unsupervised learning methods, and to evaluate how these technical categories relate to collective performance dispersion, measured through the CV of finish times. The central hypothesis of this research is that stages with higher technical demands (high elevation, mixed surfaces) are significantly associated with greater collective performance dispersion, reflecting increased physiological and tactical fatigue.</p>
<p>This study provides a robust quantitative framework useful for strategic and physiological planning in professional cycling, directly contributing to the optimization of specific training approaches, the prevention of cumulative fatigue-related injuries, and an improved understanding of how external technical loads influence the internal physiological dynamics of professional cyclists. Practically, this typology helps coaches, sports scientists, and teams tailor stage-type&#x2013;specific training, pacing/fueling, and roster/equipment choices, while anticipating fatigue to minimize performance decrements and injury risk across multi-stage races.</p>
</sec>
<sec id="s2" sec-type="methods"><label>2</label><title>Materials and methods</title>
<p><xref ref-type="fig" rid="F1">Figure&#x00A0;1</xref> summarizes the analysis pipeline: data (2017&#x2013;2023); rule-based QC/preprocessing (completeness, duplicate/neutralized removal, plausibility bounds); outlier screening via the IQR rule with conservative handling of missing entries; z-score standardization (StandardScaler) and collinearity checks (VIF); K-means clustering with optimal k by silhouette and stability by bootstrap (1,000 resamples); small-cluster rule (<italic>n</italic>&#x2009;&#x003C;&#x2009;5, descriptive only); PCA visualization; and statistical analyses, interpretation, and reporting.</p>
<fig id="F1" position="float"><label>Figure 1</label>
<caption><p>Methodological workflow. Data, QC/preprocessing, outliers/missing data, standardization/collinearity, clustering, small-cluster rule (<italic>n</italic>&#x2009;<italic>&#x003C;</italic>&#x2009;5; descriptive only), PCA, analysis and reporting.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="fspor-07-1661456-g001.tif"><alt-text content-type="machine-generated">Flowchart detailing a data analysis process. It begins with "Data (2017-2023)" leading to "QC and preprocessing," followed by "Outliers and missing" and "Standardize and collinearity." It then goes to "Clustering" with arrows pointing back to "Small-cluster rule: n &#x003C; 5" and then to "Visualization: PCA." Finally, it advances to "Statistical analyses, Interpretation and reporting."</alt-text>
</graphic>
</fig>
<sec id="s2a"><label>2.1</label><title>Study design</title>
<p>This retrospective study applied advanced statistical analysis and machine learning techniques to develop an objective and empirical classification of professional cycling stages. The dataset was derived from the publicly available &#x201C;Geospatial Road Cycling Race Results Data Set&#x201D; (<xref ref-type="bibr" rid="B23">23</xref>), which includes official race outcomes and technical details of stages from 2017 to 2023. The original data collection and validation procedures have been thoroughly described, ensuring analytical integrity and reliability for this study.</p>
</sec>
<sec id="s2b"><label>2.2</label><title>Data selection and analyzed variables</title>
<p>Data corresponding to 439 professional cycling stages from international races held between 2017 and 2023 were analyzed. Following the protocols and methodology described in (<xref ref-type="bibr" rid="B23">23</xref>), specific technical variables considered relevant according to recent literature were selected for analysis:
<list list-type="simple">
<list-item><label>&#x2022;</label>
<p>Total distance (km): Official distance covered in each stage.</p></list-item>
<list-item><label>&#x2022;</label>
<p>Total vertical gain (m): Accumulated elevation gained throughout the stage.</p></list-item>
<list-item><label>&#x2022;</label>
<p>Average relative elevation (m/km): Average gradient calculated by dividing total elevation gain by total distance.</p></list-item>
<list-item><label>&#x2022;</label>
<p>Paved percentage (&#x0025;): Proportion of the stage run on paved surfaces.</p></list-item>
<list-item><label>&#x2022;</label>
<p>Unpaved percentage (&#x0025;): Proportion of the stage run on technical unpaved surfaces.</p></list-item>
<list-item><label>&#x2022;</label>
<p>Performance CV: Coefficient of variation (CV&#x2009;&#x003D;&#x2009;SD/mean) of official finishing times across all classified riders (DNF/DSQ excluded), selected as a scale-invariant proxy that increases as the peloton fragments physiologically or tactically (e.g., breakaways, crosswinds, selective climbs), widening time gaps.</p></list-item>
</list></p>
</sec>
<sec id="s2c"><label>2.3</label><title>Statistical procedures and analytical techniques</title>
<p>All analyses were run in Python 3.10 (scikit-learn 1.4.2, pandas 2.2.2, NumPy 1.26.4, Matplotlib 3.9.2). Statistical significance was assessed at <italic>&#x03B1;</italic>&#x2009;&#x003D;&#x2009;0.05 (two-sided).</p>
<sec id="s2c1"><label>2.3.1</label><title>Preprocessing</title>
<p>We applied a rule-based pipeline to ensure data quality and internal validity: retained stages with complete values for all modelling variables (Section <xref ref-type="sec" rid="s2b">2.2</xref>) and an official finish time; removed duplicates; excluded neutralized or cancelled stages; and enforced plausibility bounds (e.g., strictly positive distance and time). Outliers were flagged using the interquartile-range rule (values &#x003C;Q1&#x2009;&#x2212;&#x2009;1.5&#x2009;&#x00D7;&#x2009;IQR or &#x003E;Q3&#x2009;&#x002B;&#x2009;1.5&#x2009;&#x00D7;&#x2009;IQR) and excluded if they violated pre-specified plausibility constraints or source metadata. Missingness was minimal: distance and finish times (for CV computation) were complete, except in cases of disqualification/withdrawal. Missing entries in total vertical gain and in road-surface composition (paved/unpaved &#x0025;) were imputed as zero under a conservative assumption.</p>
</sec>
<sec id="s2c2"><label>2.3.2</label><title>Collinearity and scaling</title>
<p>Multicollinearity among technical predictors was examined via variance inflation factors (VIFs); all VIFs were below conventional thresholds, so no remedial action was required. Predictors were z-scored (StandardScaler) to equalize scales before analysis. Clusters with fewer than five stages were summarized descriptively and excluded from between-cluster inferential tests due to unreliable within-cluster variance (<italic>n</italic>&#x2009;&#x2264;&#x2009;4) or its absence (<italic>n</italic>&#x2009;&#x003D;&#x2009;1).</p>
</sec>
<sec id="s2c3"><label>2.3.3</label><title>Clustering and validation</title>
<p>Stages were classified with K-means to obtain an objective technical typology (<xref ref-type="bibr" rid="B24">24</xref>). The number of clusters (k) was selected using the silhouette coefficient (range &#x2212;1 to 1), computed with Euclidean distances on standardized features (<xref ref-type="bibr" rid="B25">25</xref>). Cluster stability was assessed by bootstrapping (1,000 resamples); the average silhouette across resamples exceeded 0.5, indicating stable separation.</p>
</sec>
<sec id="s2c4"><label>2.3.4</label><title>Visualization and complementary analyses</title>
<p>Principal component analysis (PCA) was used solely for low-dimensional visualization of cluster structure (<xref ref-type="bibr" rid="B26">26</xref>). Complementary analyses included: (i) ordinary least squares regression of annual mean CV on calendar year (2017&#x2013;2023) to assess temporal trend; (ii) multiple linear regression of CV on standardized technical variables to quantify their partial associations; and (iii) descriptive comparisons of CV across clusters using boxplots and summary statistics (mean, SD).</p>
</sec>
</sec>
</sec>
<sec id="s3" sec-type="results"><label>3</label><title>Results</title>
<sec id="s3a"><label>3.1</label><title>Technical classification of cycling stages through unsupervised clustering</title>
<p>The application of the unsupervised KMeans clustering algorithm allowed the identification of six clearly distinct technical groups among the analyzed professional cycling stages. Visualization of these groups using PCA demonstrated clear separation, reflecting high internal coherence and strong external differentiation among the obtained clusters (<xref ref-type="fig" rid="F2">Figure&#x00A0;2</xref>).</p>
<fig id="F2" position="float"><label>Figure 2</label>
<caption><p>Two-dimensional PCA visualization illustrating the separation and distribution of the six technical clusters identified by the KMeans algorithm. Each point represents an individual cycling stage, with colors indicating the assigned technical cluster.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="fspor-07-1661456-g002.tif"><alt-text content-type="machine-generated">Scatter plot depicting data points distributed across six clusters, each represented by different colors: blue, orange, green, red, purple, and brown. The x-axis is labeled "Principal Component 1" and the y-axis is "Principal Component 2". Clusters are visually distinct but some overlap is evident, with the majority clustered around the origin.</alt-text>
</graphic>
</fig>
<p>It is noteworthy that cluster 4 contains a single stage, indicating that this represents an exceptional and technically extreme case within the dataset. This single record is characterized by an especially high combination of relative elevation, distance, and a significant percentage of unpaved surface, clearly distinguishing it from the remaining clusters. Due to its uniqueness and limited statistical representation, this cluster will be excluded from subsequent comparative analyses to ensure the methodological validity and stability of the obtained results. Nevertheless, the practical and sporting relevance of this exceptional stage type suggests that future studies using larger datasets and incorporating additional analyses, including direct physiological variables, would be necessary to fully evaluate its implications for performance and strategic planning in professional cycling.</p>
<p>The five primary clusters were named according to their predominant technical characteristics to facilitate practical interpretation:
<list list-type="simple">
<list-item><label>&#x2022;</label>
<p>Cluster 0 (Flat homogeneous stages): Flat profile with short distance, low relative elevation, and high proportion of paved surfaces.</p></list-item>
<list-item><label>&#x2022;</label>
<p>Cluster 1 (Medium-endurance stages): Stages of moderate to long distance, intermediate elevation, predominantly paved.</p></list-item>
<list-item><label>&#x2022;</label>
<p>Cluster 2 (Long mountainous stages): Stages with high distance, significant relative elevation, and mixed paved terrain.</p></list-item>
<list-item><label>&#x2022;</label>
<p>Cluster 3 (Short mixed-profile stages): Short stages with intermediate profiles, moderate elevation, and predominantly paved surfaces.</p></list-item>
<list-item><label>&#x2022;</label>
<p>Cluster 5 (Extreme technical stages): Long stages with very high relative elevation and a significant proportion of unpaved surfaces.</p></list-item>
</list></p>
</sec>
<sec id="s3b"><label>3.2</label><title>Average technical characteristics per cluster</title>
<p>The average technical characterization of each cluster identified specific stage profiles (<xref ref-type="table" rid="T1">Table&#x00A0;1</xref>). Stages grouped into clusters 2 and 5 presented the most demanding technical conditions, characterized by high relative elevation, significant distance, and substantial proportions of unpaved surfaces. In contrast, clusters 0 and 3 featured less demanding technical conditions, with lower elevation and a higher proportion of paved surfaces.</p>
<table-wrap id="T1" position="float"><label>Table 1</label>
<caption><p>Average technical characteristics and standard deviation (SD) for the five selected clusters.</p></caption>
<table frame="hsides" rules="groups">
<colgroup>
<col align="left"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
</colgroup>
<thead>
<tr>
<th valign="top" align="left">Cluster</th>
<th valign="top" align="center">Distance (km)</th>
<th valign="top" align="center">Vertical gain (m)</th>
<th valign="top" align="center">Elevation (m/km)</th>
<th valign="top" align="center">Paved (&#x0025;)</th>
<th valign="top" align="center">Unpaved (&#x0025;)</th>
<th valign="top" align="center">CV</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">0</td>
<td valign="top" align="center">120&#x2009;&#x00B1;&#x2009;15</td>
<td valign="top" align="center">500&#x2009;&#x00B1;&#x2009;120</td>
<td valign="top" align="center">4.2&#x2009;&#x00B1;&#x2009;1.1</td>
<td valign="top" align="center">98&#x2009;&#x00B1;&#x2009;2</td>
<td valign="top" align="center">2&#x2009;&#x00B1;&#x2009;1</td>
<td valign="top" align="center">0.58&#x2009;&#x00B1;&#x2009;0.04</td>
</tr>
<tr>
<td valign="top" align="left">1</td>
<td valign="top" align="center">160&#x2009;&#x00B1;&#x2009;20</td>
<td valign="top" align="center">1,800&#x2009;&#x00B1;&#x2009;200</td>
<td valign="top" align="center">11.2&#x2009;&#x00B1;&#x2009;1.8</td>
<td valign="top" align="center">90&#x2009;&#x00B1;&#x2009;3</td>
<td valign="top" align="center">10&#x2009;&#x00B1;&#x2009;2</td>
<td valign="top" align="center">0.75&#x2009;&#x00B1;&#x2009;0.04</td>
</tr>
<tr>
<td valign="top" align="left">2</td>
<td valign="top" align="center">200&#x2009;&#x00B1;&#x2009;25</td>
<td valign="top" align="center">3,000&#x2009;&#x00B1;&#x2009;250</td>
<td valign="top" align="center">15.0&#x2009;&#x00B1;&#x2009;2.0</td>
<td valign="top" align="center">85&#x2009;&#x00B1;&#x2009;4</td>
<td valign="top" align="center">15&#x2009;&#x00B1;&#x2009;3</td>
<td valign="top" align="center">0.89&#x2009;&#x00B1;&#x2009;0.04</td>
</tr>
<tr>
<td valign="top" align="left">3</td>
<td valign="top" align="center">80&#x2009;&#x00B1;&#x2009;10</td>
<td valign="top" align="center">600&#x2009;&#x00B1;&#x2009;100</td>
<td valign="top" align="center">7.5&#x2009;&#x00B1;&#x2009;1.3</td>
<td valign="top" align="center">95&#x2009;&#x00B1;&#x2009;2</td>
<td valign="top" align="center">5&#x2009;&#x00B1;&#x2009;2</td>
<td valign="top" align="center">0.66&#x2009;&#x00B1;&#x2009;0.07</td>
</tr>
<tr>
<td valign="top" align="left">5</td>
<td valign="top" align="center">190&#x2009;&#x00B1;&#x2009;25</td>
<td valign="top" align="center">4,000&#x2009;&#x00B1;&#x2009;300</td>
<td valign="top" align="center">21.1&#x2009;&#x00B1;&#x2009;2.9</td>
<td valign="top" align="center">70&#x2009;&#x00B1;&#x2009;6</td>
<td valign="top" align="center">30&#x2009;&#x00B1;&#x2009;5</td>
<td valign="top" align="center">0.85&#x2009;&#x00B1;&#x2009;0.06</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn id="table-fn1"><p>Values expressed as mean&#x2009;&#x00B1;&#x2009;standard deviation.</p></fn>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="s3c"><label>3.3</label><title>Performance variability by technical cluster</title>
<p>Collective performance variability, measured using CV of finishing times, showed significant differences according to technical stage categories. More technically demanding clusters (clusters 2 and 5) consistently presented higher CV values, reflecting higher tactical fragmentation and fatigue levels within the peloton. Conversely, less technically demanding clusters (0 and 3) exhibited lower CV values, indicating more homogeneous collective performance (<xref ref-type="fig" rid="F3">Figure&#x00A0;3</xref>).</p>
<fig id="F3" position="float"><label>Figure 3</label>
<caption><p>Distribution of collective performance variability (CV) by technical stage cluster (excluding cluster 4). Boxes represent medians and quartiles, with individual points indicating outliers.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="fspor-07-1661456-g003.tif"><alt-text content-type="machine-generated">Box plot showing performance dispersion across five technical clusters labeled zero to four. Each cluster has unique colors. The y-axis represents performance dispersion, and the x-axis represents technical clusters. Diamonds indicate means, with individual data points scattered within each cluster. Cluster zero shows higher dispersion compared to others.</alt-text>
</graphic>
</fig>
</sec>
<sec id="s3d"><label>3.4</label><title>Temporal trend of performance CV (2017&#x2013;2023)</title>
<p>To explore the temporal evolution of collective performance variability, the annual mean CV for each cluster from 2017 to 2023 was analyzed (<xref ref-type="fig" rid="F4">Figure&#x00A0;4</xref>). Overall, clusters displayed a broadly downward pattern in CV, indicating progressively more homogeneous performance; however, a pooled linear trend test of annual mean CV against calendar year with cluster fixed effects did not reach statistical significance over 2017&#x2013;2023 (<italic>p</italic>&#x2009;&#x003D;&#x2009;0.315; R<sup>2</sup>&#x2009;&#x003D;&#x2009;0.85). Note that the high R<sup>2</sup> largely reflects between-cluster differences captured by the fixed effects; the incremental variance explained by calendar year was small (&#x0394;R<sup>2</sup>&#x2009;&#x2248;&#x2009;0.04), consistent with the non-significant slope. Technically more demanding stages, those with the highest baseline CV values, showed a marked visual decline from approximately 2019 to 2022, whereas the direction and magnitude of the slope varied across clusters. In less demanding stages, CV values were consistently lower (0.52&#x2013;0.78), with moderate fluctuations and a recent tendency toward stabilization, reflecting improved peloton control and cohesion. Taken together, these temporal patterns suggest increasing homogeneity of performance over the period, while acknowledging heterogeneity in cluster-specific trajectories.</p>
<fig id="F4" position="float"><label>Figure 4</label>
<caption><p>Temporal trend of the coefficient of variation (CV) of performance by technical stage cluster (2017&#x2013;2023). Each line indicates the annual mean CV of stages assigned to each cluster.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="fspor-07-1661456-g004.tif"><alt-text content-type="machine-generated">Line chart showing the coefficient of variation from 2017 to 2023 for five clusters, labeled 0, 1, 2, 3, and 5. Clusters exhibit varied trends, with some increasing and others decreasing over the years. The y-axis represents the coefficient of variation, and the x-axis marks the years. Each cluster is represented by a distinct color: cluster 0 in blue, 1 in orange, 2 in green, 3 in red, and 5 in purple.</alt-text>
</graphic>
</fig>
</sec>
<sec id="s3e"><label>3.5</label><title>Specific contribution of technical variables on performance CV</title>
<p>Multiple regression analysis assessed the specific influence of each technical variable on collective performance variability. Relative elevation per kilometer had the strongest effect (<italic>&#x03B2;</italic>&#x2009;&#x003D;&#x2009;0.42, <italic>p</italic>&#x2009;&#x003C;&#x2009;0.001), followed by the percentage of unpaved surfaces (<italic>&#x03B2;</italic>&#x2009;&#x003D;&#x2009;0.23, <italic>p</italic>&#x2009;&#x003C;&#x2009;0.01), total distance (<italic>&#x03B2;</italic>&#x2009;&#x003D;&#x2009;0.18, <italic>p</italic>&#x2009;&#x003C;&#x2009;0.05), and total vertical gain (<italic>&#x03B2;</italic>&#x2009;&#x003D;&#x2009;0.11, <italic>p</italic>&#x2009;&#x003C;&#x2009;0.05) (<xref ref-type="table" rid="T2">Table&#x00A0;2</xref>). Specifically, in the most demanding cluster (cluster 5), the influence of relative elevation increased significantly (<italic>&#x03B2;</italic>&#x2009;&#x003D;&#x2009;0.62, <italic>p</italic>&#x2009;&#x003C;&#x2009;0.001), highlighting its critical relevance in highly technical stages.</p>
<table-wrap id="T2" position="float"><label>Table 2</label>
<caption><p>Relative contribution of technical variables to collective performance variability.</p></caption>
<table frame="hsides" rules="groups">
<colgroup>
<col align="left"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
</colgroup>
<thead>
<tr>
<th valign="top" align="left">Technical variable</th>
<th valign="top" align="center"><italic>&#x03B2;</italic></th>
<th valign="top" align="center"><italic>p</italic>-value</th>
<th valign="top" align="center">Relative contribution (&#x0025;)</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Relative elevation (m/km)</td>
<td valign="top" align="center">0.42</td>
<td valign="top" align="center">&#x003C;0.001</td>
<td valign="top" align="center">45&#x0025;</td>
</tr>
<tr>
<td valign="top" align="left">Unpaved percentage (&#x0025;)</td>
<td valign="top" align="center">0.23</td>
<td valign="top" align="center">&#x003C;0.01</td>
<td valign="top" align="center">25&#x0025;</td>
</tr>
<tr>
<td valign="top" align="left">Distance (km)</td>
<td valign="top" align="center">0.18</td>
<td valign="top" align="center">&#x003C;0.05</td>
<td valign="top" align="center">20&#x0025;</td>
</tr>
<tr>
<td valign="top" align="left">Vertical gain (m)</td>
<td valign="top" align="center">0.11</td>
<td valign="top" align="center">&#x003C;0.05</td>
<td valign="top" align="center">10&#x0025;</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s3f"><label>3.6</label><title>Bootstrap cross-validation of clustering</title>
<p>Bootstrap cross-validation (1,000 iterations) demonstrated high stability of the clustering, reflected by an average silhouette index of 0.62&#x2009;&#x00B1;&#x2009;0.03. Mean silhouette values &#x2265;0.5 indicate meaningful clustering structure; 0.62 lies within the &#x201C;reasonable&#x201D; band (0.51&#x2013;0.70) and thus supports the validity of the solution (<xref ref-type="bibr" rid="B25">25</xref>, <xref ref-type="bibr" rid="B27">27</xref>). The resulting distribution (<xref ref-type="fig" rid="F5">Figure&#x00A0;5</xref>) confirms the robust methodological stability and reproducibility of the proposed clustering solution.</p>
<fig id="F5" position="float"><label>Figure 5</label>
<caption><p>Distribution of the silhouette index obtained by bootstrap cross-validation (<italic>n</italic>&#x2009;&#x003D;&#x2009;1,000 iterations). Values above 0.5 indicate good internal cohesion and external separation of the identified clusters.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="fspor-07-1661456-g005.tif"><alt-text content-type="machine-generated">Histogram of silhouette scores with frequency on the y-axis and score on the x-axis. The distribution is skewed right, with a mean of 0.51 and a median of 0.53 marked by dashed lines.</alt-text>
</graphic>
</fig>
</sec>
</sec>
<sec id="s4" sec-type="discussion"><label>4</label><title>Discussion</title>
<p>This study builds an objective, empirically derived technical classification of professional road-cycling stages using unsupervised learning and examines its association with variability in collective performance. Specific technical features, especially average relative elevation per kilometer, total distance, and the proportion of unpaved surfaces, significantly affect finish-time dispersion (CV), in line with recent evidence on the role of external load in shaping physiology and race tactics.</p>
<p>Technically demanding groups (clusters 2 and 5), defined by high relative elevation and extensive unpaved sections, consistently exhibited higher CV, indicating greater tactical fragmentation and accumulated fatigue. Conversely, less demanding stages (clusters 0 and 3) showed lower variability, suggesting tighter group cohesion and more homogeneous physiological demands. These patterns demonstrate a direct, quantifiable effect of technical complexity on performance variability and support the value of data-driven, objective classifications for planning.</p>
<p>The classification proved stable under bootstrap cross-validation (average silhouette&#x2009;&#x003D;&#x2009;0.62&#x2009;&#x00B1;&#x2009;0.03), underscoring reproducibility and validity. Practically, coaches, sports directors, and organizers can use this framework to anticipate performance patterns and align tactical and physiological strategies with expected stage demands.</p>
<p>A notable temporal finding is a broadly downward, though not statistically significant, trend in CV from 2017 to 2023, visually most marked in the technically demanding clusters (2 and 5). This narrowing likely reflects three concurrent improvements: (1) more disciplined race control (standardized pacing and improved energy budgeting); (2) incremental technology gains that reduce random time losses (e.g., aerodynamic optimization); and (3) training and recovery practices that equalize fatigue (individualized periodization, targeted acclimation, high-carbohydrate fueling, and consistent between-stage recovery). Together, these reduce unplanned accelerations and time fragmentation, compressing finish-time distributions. Although causal claims are not warranted, the trend plausibly aligns with continued professionalization of pacing and fueling in the WorldTour era: on-bike power meters enable tighter real-time intensity control and evidence-based pacing (<xref ref-type="bibr" rid="B28">28</xref>, <xref ref-type="bibr" rid="B29">29</xref>), while contemporary carbohydrate strategies, multiple-transportable blends delivering &#x2265;60&#x2013;90&#x2005;g&#x00B7;h<sup>&#x2212;1</sup> with gut training, stabilize late-race power and mitigate performance drift, consistent with narrower distributions (<xref ref-type="bibr" rid="B30">30</xref>, <xref ref-type="bibr" rid="B31">31</xref>).</p>
<p>Among all predictors, relative elevation per kilometer exerted the strongest influence on CV (<italic>&#x03B2;</italic>&#x2009;&#x003D;&#x2009;0.42; <italic>p</italic>&#x2009;&#x003C;&#x2009;0.001), with an even larger effect in the most technical stages (cluster 5: <italic>&#x03B2;</italic>&#x2009;&#x003D;&#x2009;0.62; <italic>p</italic>&#x2009;&#x003C;&#x2009;0.001), emphasizing the centrality of gradient in training design and tactical planning.</p>
<p>The analysis relies on publicly available secondary data, which may introduce coverage and measurement biases. Geospatially derived variables (vertical gain, relative elevation, surface composition) can suffer from resolution limits and classification errors that shift stage profiles and cluster assignments. Event-specific timing protocols (e.g., neutralizations, timing resolution) may also affect CV estimates. We mitigated these risks via IQR-based outlier screening, variable standardization, and bootstrap checks of clustering stability, yet residual noise may attenuate effect sizes and limit generalizability.</p>
<p>A further limitation is the absence of direct physiological measurements (power output, heart rate, perceived exertion), which constrains mechanistic interpretation of internal responses to external technical loads. Rider-level attributes and team-strategy variables were not modeled; hence, stage-level associations between technical features and CV may be confounded by unobserved composition or tactics and should not be read as individual-level causal effects. Future work should incorporate direct physiological markers&#x2014;threshold metrics (lactate threshold/ventilatory threshold 2 or critical power) to stratify metabolic intensity; heart-rate variability (e.g., RMSSD) assessed pre-stage as readiness and in-stage heart-rate kinetics/decoupling to index internal load; and standardized perceptual responses (session-RPE). Where feasible, small-sample blood-lactate profiling in subcohorts can anchor calibration. Adding dropout rates and injury incidence would further strengthen practical and clinical implications.</p>
<p>Our dataset spans road events from 2017 to 2023 across men&#x0027;s and women&#x0027;s calendars, including one-day and stage races. Even so, the learned typology and CV associations may not transfer unchanged to contexts that deviate from the observed joint distribution&#x2014;e.g., races with markedly different peloton sizes or team structures (junior, U23, national-team starts), distinct officiating protocols (neutralizations, time bonuses, convoy/radio policies), or courses dominated by surfaces, altitudes, or weather outside our range. Such factors can inflate or dampen CV independently of our predictors. To assess external validity, future studies should evaluate held-out seasons and circuits not represented here, re-fit and calibrate clusters within coherent subgroups (junior vs. U23 vs. senior; time trials vs. mass-start), and augment models with contextual covariates (wind, temperature, crosswind-induced echelons, peloton size) alongside internal-load signals.</p>
</sec>
<sec id="s5" sec-type="conclusions"><label>5</label><title>Conclusions</title>
<p>This study provides a robust and objective empirical classification of professional cycling stages using advanced unsupervised learning techniques. Six distinct technical groups were clearly identified, showing significant relationships with collective performance variability. Particularly, relative elevation per kilometer, total distance, and terrain surface emerged as key factors influencing group performance dispersion. A broadly downward, though not statistically significant, trend in the coefficient of variation of performance was observed between 2017 and 2023, especially in more technically demanding stages, plausibly reflecting specific advances in training methods, applied technology, and strategic management in professional cycling.</p>
<p>This objective technical classification offers a practical, quantitative tool directly applicable in real-world professional cycling contexts. Coaches, sports scientists, and team directors can leverage this empirical typology to optimize competitive strategies, tailor specific training loads according to stage types, and prevent risks related to accumulated fatigue and injury. Future research integrating direct physiological measurements and additional variables on injury incidence or dropout rates will enable a deeper understanding of the physiological, tactical, and clinical dimensions of professional cycling performance.</p>
</sec>
</body>
<back>
<sec id="s6" sec-type="data-availability"><title>Data availability statement</title>
<p>Publicly available datasets were analyzed in this study. This data can be found here: <ext-link ext-link-type="uri" xlink:href="https://figshare.com/articles/dataset/Cycling_Analytics_Data_Sets/24566542">https://figshare.com/articles/dataset/Cycling_Analytics_Data_Sets/24566542</ext-link>.</p>
</sec>
<sec id="s7" sec-type="author-contributions"><title>Author contributions</title>
<p>IG-A: Writing &#x2013; original draft, Writing &#x2013; review &#x0026; editing. ED: Writing &#x2013; review &#x0026; editing. FV-F: Writing &#x2013; review &#x0026; editing.</p>
</sec>
<sec id="s8" sec-type="funding-information"><title>Funding</title>
<p>The author(s) declare that financial support was received for the research and/or publication of this article. APC support has been granted by IPN-SIP under the 2025 &#x201C;Apoyos Econ&#x00F3;micos para Publicaciones&#x201D; call.</p>
</sec>
<sec id="s9" sec-type="COI-statement"><title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s10" sec-type="ai-statement"><title>Generative AI statement</title>
<p>The author(s) declare that Generative AI was used in the creation of this manuscript. GPT-4, developed by OpenAI, was used to assist with the grammatical correction and refinement of the manuscript&#x0027;s writing.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p>
</sec>
<sec id="s11" sec-type="disclaimer"><title>Publisher&#x0027;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ref-list><title>References</title>
<ref id="B1"><label>1.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sanders</surname><given-names>D</given-names></name><name><surname>Heijboer</surname><given-names>M</given-names></name></person-group>. <article-title>Physical demands and power profile of different stage types within a cycling grand tour</article-title>. <source>Eur J Sport Sci</source>. (<year>2019</year>) <volume>19</volume>(<issue>6</issue>):<fpage>736</fpage>&#x2013;<lpage>44</lpage>. <pub-id pub-id-type="doi">10.1080/17461391.2018.1554706</pub-id><pub-id pub-id-type="pmid">30589390</pub-id></citation></ref>
<ref id="B2"><label>2.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Luc&#x00ED;a</surname><given-names>A</given-names></name><name><surname>Hoyos</surname><given-names>J</given-names></name><name><surname>Chicharro</surname><given-names>JL</given-names></name></person-group>. <article-title>Physiology of professional road cycling</article-title>. <source>Sports Med</source>. (<year>2001</year>) <volume>31</volume>(<issue>5</issue>):<fpage>325</fpage>&#x2013;<lpage>37</lpage>. <pub-id pub-id-type="doi">10.2165/00007256-200131050-00004</pub-id></citation></ref>
<ref id="B3"><label>3.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Abbiss</surname><given-names>CR</given-names></name><name><surname>Laursen</surname><given-names>PB</given-names></name></person-group>. <article-title>Describing and understanding pacing strategies during athletic competition</article-title>. <source>Sports Med Auckl NZ</source>. (<year>2008</year>) <volume>38</volume>(<issue>3</issue>):<fpage>239</fpage>&#x2013;<lpage>52</lpage>. <pub-id pub-id-type="doi">10.2165/00007256-200838030-00004</pub-id></citation></ref>
<ref id="B4"><label>4.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>VAN Erp</surname><given-names>T</given-names></name><name><surname>Sanders</surname><given-names>D</given-names></name><name><surname>Lamberts</surname><given-names>RP</given-names></name></person-group>. <article-title>Maintaining power output with accumulating levels of work done is a key determinant for success in professional cycling</article-title>. <source>Med Sci Sports Exerc</source>. (<year>2021</year>) <volume>53</volume>(<issue>9</issue>):<fpage>1903</fpage>&#x2013;<lpage>10</lpage>. <pub-id pub-id-type="doi">10.1249/MSS.0000000000002656</pub-id><pub-id pub-id-type="pmid">33731651</pub-id></citation></ref>
<ref id="B5"><label>5.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Passfield</surname><given-names>L</given-names></name><name><surname>Hopker</surname><given-names>JG</given-names></name><name><surname>Jobson</surname><given-names>S</given-names></name><name><surname>Friel</surname><given-names>D</given-names></name><name><surname>Zabala</surname><given-names>M</given-names></name></person-group>. <article-title>Knowledge is power: issues of measuring training and performance in cycling</article-title>. <source>J Sports Sci</source>. (<year>2017</year>) <volume>35</volume>(<issue>14</issue>):<fpage>1426</fpage>&#x2013;<lpage>34</lpage>. <pub-id pub-id-type="doi">10.1080/02640414.2016.1215504</pub-id><pub-id pub-id-type="pmid">27686573</pub-id></citation></ref>
<ref id="B6"><label>6.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mujika</surname><given-names>I</given-names></name><name><surname>Padilla</surname><given-names>S</given-names></name></person-group>. <article-title>Cardiorespiratory and metabolic characteristics of detraining in humans</article-title>. <source>Med Sci Sports Exerc</source>. (<year>2001</year>) <volume>33</volume>(<issue>3</issue>):<fpage>413</fpage>&#x2013;<lpage>21</lpage>. <pub-id pub-id-type="doi">10.1097/00005768-200103000-00013</pub-id><pub-id pub-id-type="pmid">11252068</pub-id></citation></ref>
<ref id="B7"><label>7.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Valenzuela</surname><given-names>PL</given-names></name><name><surname>Mateo-March</surname><given-names>M</given-names></name><name><surname>Muriel</surname><given-names>X</given-names></name><name><surname>Zabala</surname><given-names>M</given-names></name><name><surname>Lucia</surname><given-names>A</given-names></name><name><surname>Pallares</surname><given-names>JG</given-names></name><etal/></person-group> <article-title>Road gradient and cycling power: an observational study in male professional cyclists</article-title>. <source>J Sci Med Sport</source>. (<year>2022</year>) <volume>25</volume>(<issue>12</issue>):<fpage>1017</fpage>&#x2013;<lpage>22</lpage>. <pub-id pub-id-type="doi">10.1016/j.jsams.2022.10.001</pub-id><pub-id pub-id-type="pmid">36243662</pub-id></citation></ref>
<ref id="B8"><label>8.</label><citation citation-type="confproc"><person-group person-group-type="author"><name><surname>Ashtiani</surname><given-names>F</given-names></name><name><surname>Sreedhara</surname><given-names>VSM</given-names></name><name><surname>Vahidi</surname><given-names>A</given-names></name><name><surname>Hutchison</surname><given-names>R</given-names></name><name><surname>Mocko</surname><given-names>G</given-names></name></person-group>. <article-title>Experimental modeling of cyclists fatigue and recovery dynamics enabling optimal pacing in a time trial</article-title>. (<year>2019</year>). p. <fpage>5083</fpage>&#x2013;<lpage>8</lpage>.</citation></ref>
<ref id="B9"><label>9.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ammann</surname><given-names>L</given-names></name><name><surname>Chmura</surname><given-names>P</given-names></name></person-group>. <article-title>Internal and external load during on-field training drills with an aim of improving the physical performance of players in professional soccer: a retrospective observational study</article-title>. <source>Front Physiol</source>. (<year>2023</year>) <volume>14</volume>. <pub-id pub-id-type="doi">10.3389/fphys.2023.1212573</pub-id><pub-id pub-id-type="pmid">38028802</pub-id></citation></ref>
<ref id="B10"><label>10.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname><given-names>G</given-names></name><name><surname>Shang</surname><given-names>L</given-names></name><name><surname>Qin</surname><given-names>S</given-names></name><name><surname>Yu</surname><given-names>H</given-names></name></person-group>. <article-title>The impact of internal and external loads on player performance in Chinese basketball association</article-title>. <source>BMC Sports Sci Med Rehabil</source>. (<year>2024</year>) <volume>16</volume>(<issue>1</issue>):<fpage>194</fpage>. <pub-id pub-id-type="doi">10.1186/s13102-024-00983-6</pub-id><pub-id pub-id-type="pmid">39289748</pub-id></citation></ref>
<ref id="B11"><label>11.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yang</surname><given-names>K</given-names></name></person-group>. <article-title>Quarterly fluctuations in external and internal loads among professional basketball players</article-title>. <source>Front Physiol</source>. (<year>2024</year>) <volume>15</volume>. <pub-id pub-id-type="doi">10.3389/fphys.2024.1419097</pub-id></citation></ref>
<ref id="B12"><label>12.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mateo-March</surname><given-names>M</given-names></name><name><surname>Valenzuela</surname><given-names>PL</given-names></name><name><surname>Muriel</surname><given-names>X</given-names></name><name><surname>Gandia-Soriano</surname><given-names>A</given-names></name><name><surname>Zabala</surname><given-names>M</given-names></name><name><surname>Lucia</surname><given-names>A</given-names></name><etal/></person-group> <article-title>The record power profile of male professional cyclists: fatigue matters</article-title>. <source>Int J Sports Physiol Perform</source>. (<year>2022</year>) <volume>17</volume>(<issue>6</issue>):<fpage>926</fpage>&#x2013;<lpage>31</lpage>. <pub-id pub-id-type="doi">10.1123/ijspp.2021-0403</pub-id><pub-id pub-id-type="pmid">35240578</pub-id></citation></ref>
<ref id="B13"><label>13.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bonato</surname><given-names>G</given-names></name><name><surname>Goodman</surname><given-names>SPJ</given-names></name><name><surname>Tjh</surname><given-names>L</given-names></name></person-group>. <article-title>Physiological and performance effects of live high train low altitude training for elite endurance athletes: a narrative review</article-title>. <source>Curr Res Physiol</source>. (<year>2023</year>) <volume>6</volume>:<fpage>100113</fpage>. <pub-id pub-id-type="doi">10.1016/j.crphys.2023.100113</pub-id><pub-id pub-id-type="pmid">38107789</pub-id></citation></ref>
<ref id="B14"><label>14.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Turner</surname><given-names>MM</given-names></name></person-group>. <article-title>Cycling on rough roads: a model for resistance and vibration</article-title>. <source>Veh Syst Dyn</source>. (<year>2024</year>) <volume>62</volume>(<issue>10</issue>):<fpage>2729</fpage>&#x2013;<lpage>49</lpage>. <pub-id pub-id-type="doi">10.1080/00423114.2024.2304031</pub-id></citation></ref>
<ref id="B15"><label>15.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Davis</surname><given-names>J</given-names></name><name><surname>Bransen</surname><given-names>L</given-names></name><name><surname>Devos</surname><given-names>L</given-names></name><name><surname>Jaspers</surname><given-names>A</given-names></name><name><surname>Meert</surname><given-names>W</given-names></name><name><surname>Robberechts</surname><given-names>P</given-names></name><etal/></person-group> <article-title>Methodology and evaluation in sports analytics: challenges, approaches, and lessons learned</article-title>. <source>Mach Learn</source>. (<year>2024</year>) <volume>113</volume>(<issue>9</issue>):<fpage>6977</fpage>&#x2013;<lpage>7010</lpage>. <pub-id pub-id-type="doi">10.1007/s10994-024-06585-0</pub-id></citation></ref>
<ref id="B16"><label>16.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Xia</surname><given-names>J</given-names></name><name><surname>Wang</surname><given-names>J</given-names></name><name><surname>Chen</surname><given-names>H</given-names></name><name><surname>Zhuang</surname><given-names>J</given-names></name><name><surname>Cao</surname><given-names>Z</given-names></name><name><surname>Chen</surname><given-names>P</given-names></name></person-group>. <article-title>An unsupervised machine learning approach to evaluate sports facilities condition in primary school</article-title>. <source>PLoS One</source>. (<year>2022</year>) <volume>17</volume>(<issue>4</issue>). <pub-id pub-id-type="doi">10.1371/journal.pone.0267009</pub-id></citation></ref>
<ref id="B17"><label>17.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rivadulla</surname><given-names>AR</given-names></name><name><surname>Chen</surname><given-names>X</given-names></name><name><surname>Cazzola</surname><given-names>D</given-names></name><name><surname>Trewartha</surname><given-names>G</given-names></name><name><surname>Preatoni</surname><given-names>E</given-names></name></person-group>. <article-title>Clustering analysis across different speeds reveals two distinct running techniques with no differences in running economy</article-title>. <source>Sports Biomech</source>. (<year>2024</year>) <volume>11</volume>:<fpage>1</fpage>&#x2013;<lpage>24</lpage>. <pub-id pub-id-type="doi">10.1080/14763141.2024.2372608</pub-id></citation></ref>
<ref id="B18"><label>18.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Martin</surname><given-names>JA</given-names></name><name><surname>Stiffler-Joachim</surname><given-names>MR</given-names></name><name><surname>Wille</surname><given-names>CM</given-names></name><name><surname>Heiderscheit</surname><given-names>BC</given-names></name></person-group>. <article-title>A hierarchical clustering approach for examining potential risk factors for bone stress injury in runners</article-title>. <source>J Biomech</source>. (<year>2022</year>) <volume>141</volume>:<fpage>111136</fpage>. <pub-id pub-id-type="doi">10.1016/j.jbiomech.2022.111136</pub-id><pub-id pub-id-type="pmid">35816783</pub-id></citation></ref>
<ref id="B19"><label>19.</label><citation citation-type="other"><person-group person-group-type="author"><name><surname>Bouvet</surname><given-names>A</given-names></name><name><surname>Kolei</surname><given-names>SE</given-names></name><name><surname>Marbac</surname><given-names>M</given-names></name></person-group>. <article-title>Investigating swimming technical skills by a double partition clustering of multivariate functional data allowing for dimension selection [Internet]</article-title>. <comment><italic>arXiv</italic></comment>. (<year>2023</year>). <comment>Available from:</comment> <ext-link ext-link-type="uri" xlink:href="http://arxiv.org/abs/2303.15812">http://arxiv.org/abs/2303.15812</ext-link></citation></ref>
<ref id="B20"><label>20.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Reis</surname><given-names>FJJ</given-names></name><name><surname>Alaiti</surname><given-names>RK</given-names></name><name><surname>Vallio</surname><given-names>CS</given-names></name><name><surname>Hespanhol</surname><given-names>L</given-names></name></person-group>. <article-title>Artificial intelligence and machine learning approaches in sports: concepts, applications, challenges, and future perspectives</article-title>. <source>Braz J Phys Ther</source>. (<year>2024</year>) <volume>28</volume>(<issue>3</issue>):<fpage>101083</fpage>. <pub-id pub-id-type="doi">10.1016/j.bjpt.2024.101083</pub-id><pub-id pub-id-type="pmid">38838418</pub-id></citation></ref>
<ref id="B21"><label>21.</label><citation citation-type="book"><person-group person-group-type="author"><name><surname>Phillips</surname><given-names>KE</given-names></name></person-group>. <source>An Examination of the Factors Determining the Performance of Cyclists in Elite Competitions</source>. <publisher-loc>Melbourne</publisher-loc>: <publisher-name>Victoria University</publisher-name> (<year>2020</year>).</citation></ref>
<ref id="B22"><label>22.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ausloos</surname><given-names>M</given-names></name></person-group>. <article-title>Shannon entropy and Herfindahl-Hirschman index as team&#x2019;s performance and competitive balance indicators in cyclist multi-stage races</article-title>. <source>Entropy</source>. (<year>2023</year>) <volume>25</volume>(<issue>6</issue>):<fpage>955</fpage>. <pub-id pub-id-type="doi">10.3390/e25060955</pub-id><pub-id pub-id-type="pmid">37372299</pub-id></citation></ref>
<ref id="B23"><label>23.</label><citation citation-type="other"><person-group person-group-type="author"><name><surname>Janssens</surname><given-names>B</given-names></name><name><surname>Pappalardo</surname><given-names>L</given-names></name><name><surname>Bock</surname><given-names>JD</given-names></name><name><surname>Bogaert</surname><given-names>M</given-names></name><name><surname>Verstockt</surname><given-names>S</given-names></name></person-group>. <article-title>Geospatial Road Cycling Race Results Data Set</article-title>. <comment><italic>arXiv</italic></comment>. (<year>2024</year>).</citation></ref>
<ref id="B24"><label>24.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lloyd</surname><given-names>S</given-names></name></person-group>. <article-title>Least squares quantization in PCM</article-title>. <source>IEEE Trans Inf Theory</source>. (<year>1982</year>) <volume>28</volume>(<issue>2</issue>):<fpage>129</fpage>&#x2013;<lpage>37</lpage>. <pub-id pub-id-type="doi">10.1109/TIT.1982.1056489</pub-id></citation></ref>
<ref id="B25"><label>25.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rousseeuw</surname><given-names>PJ</given-names></name></person-group>. <article-title>Silhouettes: a graphical aid to the interpretation and validation of cluster analysis</article-title>. <source>J Comput Appl Math</source>. (<year>1987</year>) <volume>20</volume>:<fpage>53</fpage>&#x2013;<lpage>65</lpage>. <pub-id pub-id-type="doi">10.1016/0377-0427(87)90125-7</pub-id></citation></ref>
<ref id="B26"><label>26.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wold</surname><given-names>S</given-names></name><name><surname>Esbensen</surname><given-names>K</given-names></name><name><surname>Geladi</surname><given-names>P</given-names></name></person-group>. <article-title>Principal component analysis</article-title>. <source>Chemom Intell Lab Syst</source>. (<year>1987</year>) <volume>2</volume>(<issue>1</issue>):<fpage>37</fpage>&#x2013;<lpage>52</lpage>. <pub-id pub-id-type="doi">10.1016/0169-7439(87)80084-9</pub-id></citation></ref>
<ref id="B27"><label>27.</label><citation citation-type="book"><person-group person-group-type="author"><name><surname>Kaufman</surname><given-names>L</given-names></name><name><surname>Rousseeuw</surname><given-names>PJ</given-names></name></person-group>. <source>Finding Groups in Data: An Introduction to Cluster Analysis [Internet]</source>. <edition>1st ed.</edition> <publisher-loc>New York</publisher-loc>: <publisher-name>Wiley</publisher-name> (<year>1990</year>). <comment>Available online at</comment>: <ext-link ext-link-type="uri" xlink:href="https://onlinelibrary.wiley.com/doi/book/10.1002/9780470316801">https://onlinelibrary.wiley.com/doi/book/10.1002/9780470316801</ext-link></citation></ref>
<ref id="B28"><label>28.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sundstr&#x00F6;m</surname><given-names>D</given-names></name><name><surname>Carlsson</surname><given-names>P</given-names></name><name><surname>Tinnsten</surname><given-names>M</given-names></name></person-group>. <article-title>On optimization of pacing strategy in road cycling</article-title>. <source>Procedia Eng</source>. (<year>2013</year>) <volume>60</volume>:<fpage>118</fpage>&#x2013;<lpage>23</lpage>. <pub-id pub-id-type="doi">10.1016/j.proeng.2013.07.062</pub-id></citation></ref>
<ref id="B29"><label>29.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Leo</surname><given-names>P</given-names></name><name><surname>Spragg</surname><given-names>J</given-names></name><name><surname>Podlogar</surname><given-names>T</given-names></name><name><surname>Lawley</surname><given-names>JS</given-names></name><name><surname>Mujika</surname><given-names>I</given-names></name></person-group>. <article-title>Power profiling and the power-duration relationship in cycling: a narrative review</article-title>. <source>Eur J Appl Physiol</source>. (<year>2022</year>) <volume>122</volume>(<issue>2</issue>):<fpage>301</fpage>&#x2013;<lpage>16</lpage>. <pub-id pub-id-type="doi">10.1007/s00421-021-04833-y</pub-id><pub-id pub-id-type="pmid">34708276</pub-id></citation></ref>
<ref id="B30"><label>30.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jeukendrup</surname><given-names>AE</given-names></name></person-group>. <article-title>Nutrition for endurance sports: marathon, triathlon, and road cycling</article-title>. <source>J Sports Sci</source>. (<year>2011</year>) <volume>29</volume>(<issue>Suppl 1</issue>):<fpage>S91</fpage>&#x2013;<lpage>9</lpage>. <pub-id pub-id-type="doi">10.1080/02640414.2011.610348</pub-id><pub-id pub-id-type="pmid">21916794</pub-id></citation></ref>
<ref id="B31"><label>31.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Burke</surname><given-names>LM</given-names></name><name><surname>Hawley</surname><given-names>JA</given-names></name><name><surname>Jeukendrup</surname><given-names>A</given-names></name><name><surname>Morton</surname><given-names>JP</given-names></name><name><surname>Stellingwerff</surname><given-names>T</given-names></name><name><surname>Maughan</surname><given-names>RJ</given-names></name></person-group>. <article-title>Toward a common understanding of diet-exercise strategies to manipulate fuel availability for training and competition preparation in endurance sport</article-title>. <source>Int J Sport Nutr Exerc Metab</source>. (<year>2018</year>) <volume>28</volume>(<issue>5</issue>):<fpage>451</fpage>&#x2013;<lpage>63</lpage>. <pub-id pub-id-type="doi">10.1123/ijsnem.2018-0289</pub-id><pub-id pub-id-type="pmid">30249148</pub-id></citation></ref></ref-list>
</back>
</article>