<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Psychol.</journal-id>
<journal-title>Frontiers in Psychology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Psychol.</abbrev-journal-title>
<issn pub-type="epub">1664-1078</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fpsyg.2025.1516417</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Psychology</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Goal and shot prediction in ball possessions in FIFA Women&#x2019;s World Cup 2023: a machine learning approach</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes">
<name><surname>Iv&#x00E1;n-Baraga&#x00F1;o</surname> <given-names>Iy&#x00E1;n</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x002A;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/849837/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Ard&#x00E1;</surname> <given-names>Antonio</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/459484/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Losada</surname> <given-names>Jos&#x00E9; L.</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/209644/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Maneiro</surname> <given-names>Rub&#x00E9;n</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/403289/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>Department of Sport Sciences, Faculty of Medicine, Health and Sports, Universidad Europea de Madrid</institution>, <addr-line>Madrid</addr-line>, <country>Spain</country></aff>
<aff id="aff2"><sup>2</sup><institution>Department of Physical and Sport Education, University of A Coru&#x00F1;a</institution>, <addr-line>A Coru&#x00F1;a</addr-line>, <country>Spain</country></aff>
<aff id="aff3"><sup>3</sup><institution>Department of Social Psychology and Quantitative Psychology, University of Barcelona</institution>, <addr-line>Barcelona</addr-line>, <country>Spain</country></aff>
<aff id="aff4"><sup>4</sup><institution>Faculty of Education and Sport, University of Vigo</institution>, <addr-line>Vigo</addr-line>, <country>Spain</country></aff>
<author-notes>
<fn id="fn0001" fn-type="edited-by"><p>Edited by: Yixiong Cui, Beijing Sport University, China</p></fn>
<fn id="fn0002" fn-type="edited-by"><p>Reviewed by: Miguel Pic, University of Valladolid, Spain</p>
<p>Zhaoxian Zhou, University of Southern Mississippi, United States</p></fn>
<corresp id="c001">&#x002A;Correspondence: Iy&#x00E1;n Iv&#x00E1;n-Baraga&#x00F1;o, <email>iyanivanbaragano@gmail.com</email></corresp>
</author-notes>
<pub-date pub-type="epub">
<day>31</day>
<month>01</month>
<year>2025</year>
</pub-date>
<pub-date pub-type="collection">
<year>2025</year>
</pub-date>
<volume>16</volume>
<elocation-id>1516417</elocation-id>
<history>
<date date-type="received">
<day>24</day>
<month>10</month>
<year>2024</year>
</date>
<date date-type="accepted">
<day>22</day>
<month>01</month>
<year>2025</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2025 Iv&#x00E1;n-Baraga&#x00F1;o, Ard&#x00E1;, Losada and Maneiro.</copyright-statement>
<copyright-year>2025</copyright-year>
<copyright-holder>Iv&#x00E1;n-Baraga&#x00F1;o, Ard&#x00E1;, Losada and Maneiro</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<sec>
<title>Introduction</title>
<p>Research in women&#x2019;s football and the use of new game analysis tools have developed significantly in recent years. The objectives of this study were to create two predictive classification models to forecast the occurrence of a shot or a goal in the FIFA Women&#x2019;s World Cup 2023 and to identify the associated technical-tactical indicators to these outcomes.</p>
</sec>
<sec>
<title>Methods</title>
<p>A total of 2,346 ball possessions were analyzed using an observational design, mapping two different target variables (Success&#x202F;=&#x202F;Goal and Success2&#x202F;=&#x202F;Goal or Shot) with a relative frequency of 1.28 and 8.35%, respectively. The predictive capacity was tested using Random Forest and XGBoost, and finally SHAP values were calculated and visualized to understand the influence of the predictors.</p>
</sec>
<sec>
<title>Results</title>
<p>The Random Forest technique showed greater efficacy, with recall and specificity above 93% in the resampled dataset. However, recall on the original test sample was 13% (Success&#x202F;=&#x202F;Shot or Goal) and 0% (Success&#x202F;=&#x202F;Goal), demonstrating the models&#x2019; inability to predict rare events in football, such as goals. The indicators with the greatest influence on the outcome of these possessions were related to the possession zone, attack duration, number of passes, and starting zone, among others.</p>
</sec>
<sec>
<title>Conclusion</title>
<p>The results highlight the need to incorporate a greater number of predictive variables in the models and underline the difficulty of predicting events such as goals and shots in women&#x2019;s football.</p>
</sec>
</abstract>
<kwd-group>
<kwd>female football</kwd>
<kwd>women&#x2019;s soccer</kwd>
<kwd>predictive models</kwd>
<kwd>machine learning</kwd>
<kwd>performance analysis</kwd>
<kwd>FIFA Women&#x2019;s World Cup 2023</kwd>
</kwd-group>
<counts>
<fig-count count="7"/>
<table-count count="2"/>
<equation-count count="0"/>
<ref-count count="48"/>
<page-count count="10"/>
<word-count count="6134"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Movement Science</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="sec1">
<label>1</label>
<title>Introduction</title>
<p>The analysis of technical-tactical performance in men&#x2019;s football began to develop significantly in the late 20th and early 21st centuries (<xref ref-type="bibr" rid="ref14">Hughes and Bartlett, 2002</xref>), using notational and observational records (<xref ref-type="bibr" rid="ref39">Preciado et al., 2019</xref>). Later, with the use of new technologies, this analysis started to be conducted on data obtained from positional sensors such as Global Positioning System (GPS) and Local Positioning System (LPM) (<xref ref-type="bibr" rid="ref25">Low et al., 2020</xref>). In the case of women&#x2019;s football, the lower participation of women in the sport and a lack of social and research interest delayed the publication of the first studies by more than a decade (<xref ref-type="bibr" rid="ref18">Kirkendall, 2007</xref>; <xref ref-type="bibr" rid="ref30">Mara et al., 2012</xref>; <xref ref-type="bibr" rid="ref47">Leite, 2013</xref>). A significant increase in research occurred starting in 2020, coinciding with the FIFA Women&#x2019;s World Cup 2019 (<xref ref-type="bibr" rid="ref22">Lee and Mills, 2021</xref>; <xref ref-type="bibr" rid="ref16">Iv&#x00E1;n-Baraga&#x00F1;o et al., 2022</xref>; <xref ref-type="bibr" rid="ref19">Kubayi, 2022</xref>) and, later, with the FIFA Women&#x2019;s World Cup 2023 (<xref ref-type="bibr" rid="ref8">Branquinho et al., 2024</xref>; <xref ref-type="bibr" rid="ref6">Bradley, 2025a</xref>, <xref ref-type="bibr" rid="ref7">2025b</xref>; <xref ref-type="bibr" rid="ref17">Iv&#x00E1;n-Baraga&#x00F1;o et al., 2025</xref>; <xref ref-type="bibr" rid="ref34">Oliva-Lozano et al., 2025</xref>).</p>
<p>Currently, Artificial Intelligence, and Machine Learning in particular, have become topics of interest for researchers and practitioners (<xref ref-type="bibr" rid="ref33">Nassis et al., 2023</xref>; <xref ref-type="bibr" rid="ref40">Rico-Gonz&#x00E1;lez et al., 2023</xref>), who have conducted studies with various objectives, such as establishing differences between men&#x2019;s and women&#x2019;s football (<xref ref-type="bibr" rid="ref35">Pappalardo et al., 2021</xref>), predicting injury risk (<xref ref-type="bibr" rid="ref41">Robles-Palaz&#x00F3;n et al., 2021</xref>), or the probability of success of different types of actions, such as entries into the penalty area (<xref ref-type="bibr" rid="ref15">Iv&#x00E1;n-Baraga&#x00F1;o et al., 2021</xref>; <xref ref-type="bibr" rid="ref46">Stival et al., 2023</xref>) or shots during set-piece situations (<xref ref-type="bibr" rid="ref28">Maneiro et al., 2019</xref>). In all of these studies, different regression and/or classification models were trained with the aim of predicting outcomes or future behaviors.</p>
<p>More recently, other studies have attempted to apply more complex strategies, materialized in the use of various techniques based on deep neural networks. Among the different examples of the use and application of Artificial Intelligence in the analysis of high-performance football, the article by <xref ref-type="bibr" rid="ref2">AlMulla et al. (2023)</xref> trained a deep neural network model (Gated Recurrent Unit) to predict the outcomes of football matches in the Qatari league over 10 consecutive seasons, using data from data providers. Similarly, <xref ref-type="bibr" rid="ref48">Wang et al. (2024)</xref> trained and evaluated a generative AI model based on deep learning and graph methods, which allowed the generation of execution proposals for set-piece actions. This was part of an unusual collaboration between Google DeepMind and Liverpool FC. Despite this, and in agreement with <xref ref-type="bibr" rid="ref11">Claudino et al. (2019)</xref>, the synergy that Artificial Intelligence needs to create alongside football still requires further development in the coming years.</p>
<p>This gap is even more pronounced in the case of women&#x2019;s football, with scarce scientific evidence where AI or ML has been applied to female samples. In this regard, some authors have sought to understand the differences between men&#x2019;s and women&#x2019;s football (<xref ref-type="bibr" rid="ref35">Pappalardo et al., 2021</xref>) using supervised ML techniques and applying explainability methods such as SHAP values (<xref ref-type="bibr" rid="ref26">Lundberg and Lee, 2017</xref>). On the other hand, other studies have conducted analyses of offensive play using supervised techniques such as binary logistic regression (<xref ref-type="bibr" rid="ref16">Iv&#x00E1;n-Baraga&#x00F1;o et al., 2022</xref>), multinomial logistic regression (<xref ref-type="bibr" rid="ref9">Casal et al., 2023</xref>), or decision trees (<xref ref-type="bibr" rid="ref28">Maneiro et al., 2019</xref>). Additionally, some authors (<xref ref-type="bibr" rid="ref44">Shen et al., 2024</xref>) have proposed models focused on convolutional neural networks and computer vision to determine offensive positioning in women&#x2019;s football, using images extracted from UEFA Women&#x2019;s Champions League matches.</p>
<p>In any case, and as a common aspect of studies conducted using supervised machine learning classification techniques, most studies have been carried out using methods characterized by high intrinsic explainability (such as decision trees or logistic regression), but often with moderate performance. In this context, there is a need to improve the performance of predictive models applied to a chaotic and non-linear reality like football, without sacrificing interpretability, to ensure the application of these studies&#x2019; results to training and competition.</p>
<p>For the reasons mentioned above, the objective of this study was twofold. First, it aimed to create two binary classification models that would allow the prediction of the outcome of ball possessions in elite women&#x2019;s football (i.e., whether the possessions end in a Goal or a Shot). Additionally, once these models were trained, the SHAP library was implemented to identify the technical-tactical performance indicators that had the greatest influence on the model.</p>
</sec>
<sec sec-type="materials|methods" id="sec2">
<label>2</label>
<title>Materials and methods</title>
<sec id="sec3">
<label>2.1</label>
<title>Design and participants</title>
<p>The study was framed within the systematic observational methodology proposed by <xref ref-type="bibr" rid="ref3">Anguera (1979)</xref> employing a nomothetic design, as multiple units of analysis were examined, represented by each participating team; it featured punctual inter-sessional tracking due to the temporal association between the actions analyzed within a single match; and it was multidimensional, as the observation instrument addressed the dimensions of identification, initiation, development, and outcome of ball possessions (<xref ref-type="bibr" rid="ref4">Anguera et al., 2011</xref>).</p>
<p>All ball possessions during the final phase (from the Round of 16 onwards) of the FIFA Women&#x2019;s World Cup 2023 were analyzed, provided they met the following inclusion criteria: (i) a minimum duration of 4&#x202F;s, and (ii) the possession must involve two consecutive touches of the ball, a pass, or a shot (<xref ref-type="bibr" rid="ref1">Almeida et al., 2014</xref>).</p>
</sec>
<sec id="sec4">
<label>2.2</label>
<title>Observation and recording instrument</title>
<p>The observation instrument was created by a panel of experts, including three researchers with over 30&#x202F;years of experience in observational methodology, and can be consulted in <xref ref-type="table" rid="tab1">Table 1</xref>. It comprised 18 criteria and 51 categories. The analyzed criteria were organized into 4 dimensions corresponding to the identification, start, development, and outcome of the ball possession. The recording instrument used for this study was LINCE PLUS (<xref ref-type="bibr" rid="ref45">Soto-Fern&#x00E1;ndez et al., 2021</xref>).</p>
<table-wrap position="float" id="tab1">
<label>Table 1</label>
<caption><p>Observational instrument: criteria, categories, and operational definition.</p></caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Criteria</th>
<th align="left" valign="top">Categories</th>
<th align="left" valign="top">Operational definition</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top">Observed team</td>
<td align="left" valign="top">Teams analyzed</td>
<td align="left" valign="top">The team that executed the ball possession</td>
</tr>
<tr>
<td align="left" valign="top" rowspan="3">Match outcome</td>
<td align="left" valign="top">Win</td>
<td align="left" valign="top">The team observed won the match</td>
</tr>
<tr>
<td align="left" valign="top">Lose</td>
<td align="left" valign="top">The team observed lost the match</td>
</tr>
<tr>
<td align="left" valign="top">Draw</td>
<td align="left" valign="top">The team observed drew the match</td>
</tr>
<tr>
<td align="left" valign="top" rowspan="6">Time</td>
<td align="left" valign="top">1Q</td>
<td align="left" valign="top">Possession starts between the start of the game and minute 15</td>
</tr>
<tr>
<td align="left" valign="top">2Q</td>
<td align="left" valign="top">Possession starts between minute 16 and minute 30</td>
</tr>
<tr>
<td align="left" valign="top">3Q</td>
<td align="left" valign="top">Possession starts between minute 31 and the end of the first half</td>
</tr>
<tr>
<td align="left" valign="top">4Q</td>
<td align="left" valign="top">Possession starts between the start of the second half and minute 60</td>
</tr>
<tr>
<td align="left" valign="top">5Q</td>
<td align="left" valign="top">Possession starts between minute 61 and minute 75</td>
</tr>
<tr>
<td align="left" valign="top">6Q</td>
<td align="left" valign="top">Possession starts between minute 76 and the end of the game</td>
</tr>
<tr>
<td align="left" valign="top" rowspan="3">Match status</td>
<td align="left" valign="top">Winning</td>
<td align="left" valign="top">The team observed is winning when the action starts</td>
</tr>
<tr>
<td align="left" valign="top">Drawing</td>
<td align="left" valign="top">The teams are level when the action starts</td>
</tr>
<tr>
<td align="left" valign="top">Losing</td>
<td align="left" valign="top">The team observed is losing when the action starts</td>
</tr>
<tr>
<td align="left" valign="top" rowspan="2">Start form</td>
<td align="left" valign="top">Set Play</td>
<td align="left" valign="top">Possession begins after a regulatory interruption of the game.</td>
</tr>
<tr>
<td align="left" valign="top">Transition</td>
<td align="left" valign="top">Possession begins without a regulatory interruption.</td>
</tr>
<tr>
<td align="left" valign="top" rowspan="5">Start zone (length)</td>
<td align="left" valign="top">Defensive</td>
<td align="left" valign="top">Possession begins in the defensive area of the pitch</td>
</tr>
<tr>
<td align="left" valign="top">Predefensive</td>
<td align="left" valign="top">Possession begins in the predefensive area of the pitch</td>
</tr>
<tr>
<td align="left" valign="top">Middle</td>
<td align="left" valign="top">Possession begins in the middle area of the pitch</td>
</tr>
<tr>
<td align="left" valign="top">Preoffensive</td>
<td align="left" valign="top">Possession begins in the preoffensive area of the pitch</td>
</tr>
<tr>
<td align="left" valign="top">Offensive</td>
<td align="left" valign="top">Possession begins in the offensive area of the pitch</td>
</tr>
<tr>
<td align="left" valign="top" rowspan="3">Start zone (width)</td>
<td align="left" valign="top">Left</td>
<td align="left" valign="top">Possession starts from the left wing</td>
</tr>
<tr>
<td align="left" valign="top">Central</td>
<td align="left" valign="top">Possession starts from the center</td>
</tr>
<tr>
<td align="left" valign="top">Right</td>
<td align="left" valign="top">Possession starts from the right wing</td>
</tr>
<tr>
<td align="left" valign="top" rowspan="2">Defensive organization</td>
<td align="left" valign="top">Organized</td>
<td align="left" valign="top">The opposing team is defensively organized</td>
</tr>
<tr>
<td align="left" valign="top">Circumstantial</td>
<td align="left" valign="top">The opposing team is defensively disorganized</td>
</tr>
<tr>
<td align="left" valign="top" rowspan="3">Defensive positioning</td>
<td align="left" valign="top">Low</td>
<td align="left" valign="top">Opponents&#x2019; positioning is at the back at the start of the action</td>
</tr>
<tr>
<td align="left" valign="top">Medium</td>
<td align="left" valign="top">Opponents&#x2019; positioning is midfield at the start of the action</td>
</tr>
<tr>
<td align="left" valign="top">Advanced</td>
<td align="left" valign="top">Opponents&#x2019; positioning is forward at the start of the action</td>
</tr>
<tr>
<td align="left" valign="top" rowspan="10">Interaction context</td>
<td align="left" valign="top">MM</td>
<td align="left" valign="top">Midfield zone vs. midfield zone</td>
</tr>
<tr>
<td align="left" valign="top">RA</td>
<td align="left" valign="top">Rear zone vs. forward zone</td>
</tr>
<tr>
<td align="left" valign="top">RM</td>
<td align="left" valign="top">Rear zone vs. midfield zone</td>
</tr>
<tr>
<td align="left" valign="top">A0</td>
<td align="left" valign="top">Forward zone vs. goalkeeper</td>
</tr>
<tr>
<td align="left" valign="top">AA</td>
<td align="left" valign="top">Forward zone vs. forward zone</td>
</tr>
<tr>
<td align="left" valign="top">AM</td>
<td align="left" valign="top">Forward zone vs. midfield</td>
</tr>
<tr>
<td align="left" valign="top">AR</td>
<td align="left" valign="top">Forward zone vs. rear zone</td>
</tr>
<tr>
<td align="left" valign="top">MA</td>
<td align="left" valign="top">Midfield zone vs. forward zone</td>
</tr>
<tr>
<td align="left" valign="top">MR</td>
<td align="left" valign="top">Midfield zone vs. rear zone</td>
</tr>
<tr>
<td align="left" valign="top">PA</td>
<td align="left" valign="top">Goalkeeper vs. forward zone</td>
</tr>
<tr>
<td align="left" valign="top" rowspan="2">Offensive intention</td>
<td align="left" valign="top">Keep</td>
<td align="left" valign="top">The team observed tries to maintain possession of the ball</td>
</tr>
<tr>
<td align="left" valign="top">Progress</td>
<td align="left" valign="top">The team observed tries to progress towards the rival goal</td>
</tr>
<tr>
<td align="left" valign="top" rowspan="2">Defensive intention</td>
<td align="left" valign="top">No pressure</td>
<td align="left" valign="top">The opposing team shows an intention to defend their goal</td>
</tr>
<tr>
<td align="left" valign="top">Pressure</td>
<td align="left" valign="top">The opposing team shows an intention to recover the ball</td>
</tr>
<tr>
<td align="left" valign="top">MD (seconds)</td>
<td/>
<td align="left" valign="top">Time of possession in own half (in seconds)</td>
</tr>
<tr>
<td align="left" valign="top">MO (seconds)</td>
<td/>
<td align="left" valign="top">Time of possession in opponent&#x2019;s half (in seconds)</td>
</tr>
<tr>
<td align="left" valign="top">Possession time</td>
<td/>
<td align="left" valign="top">Total time of possession</td>
</tr>
<tr>
<td align="left" valign="top">Passes</td>
<td/>
<td align="left" valign="top">Number of passes</td>
</tr>
<tr>
<td align="left" valign="top" rowspan="2">Possession zone</td>
<td align="left" valign="top">MD</td>
<td align="left" valign="top">Most possession in own half</td>
</tr>
<tr>
<td align="left" valign="top">MO</td>
<td align="left" valign="top">Most possession in opponent&#x2019;s half</td>
</tr>
<tr>
<td align="left" valign="top" rowspan="4">Possession outcome</td>
<td align="left" valign="top">Goal</td>
<td align="left" valign="top">The possession ends with a goal</td>
</tr>
<tr>
<td align="left" valign="top">Shot</td>
<td align="left" valign="top">The possession ends with a shot</td>
</tr>
<tr>
<td align="left" valign="top">Sent to area</td>
<td align="left" valign="top">The possession ends with a ball into the penalty area</td>
</tr>
<tr>
<td align="left" valign="top">No success</td>
<td align="left" valign="top">The possession ends with no success.</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="sec5">
<label>2.3</label>
<title>Procedure and reliability</title>
<p>Prior to conducting the recording, the observers were trained and familiarized with the observation instrument over 4 sessions, following the procedure proposed by <xref ref-type="bibr" rid="ref24">Losada and Manolov (2015)</xref>. The reliability of the observation instrument was verified through the calculation of <xref ref-type="bibr" rid="ref12">Cohen&#x2019;s (1960)</xref> Kappa coefficient for both intra- and inter-observer reliability among the study&#x2019;s authors. The average obtained was 0.869 (range: 0.729&#x2013;0.979), which is considered excellent (<xref ref-type="bibr" rid="ref20">Landis and Koch, 1977</xref>), based on the average of all criteria and observations made on 258 records corresponding to two matches.</p>
</sec>
<sec id="sec6">
<label>2.4</label>
<title>Data cleaning and preprocessing</title>
<p>Once the data matrix was obtained, consisting of 2,346 ball possession records, the following cleaning and preprocessing tasks were performed using the Scikit-Learn library (<xref ref-type="bibr" rid="ref36">Pedregosa et al., 2011</xref>): (i) Checking for null values (none were found), (ii) Mapping the Possession Outcome variable into two binary recodings (Recoding 1: Success&#x202F;=&#x202F;Goal or Shot, No Success&#x202F;=&#x202F;Rest of the possessions &#x0026; Recoding 2: Success&#x202F;=&#x202F;Goal, No Success&#x202F;=&#x202F;Rest of the possessions), (iii) Scaling of quantitative variables using the MinMaxScaler technique due to the skewness of the distribution (<xref ref-type="fig" rid="fig1">Figure 1</xref>), (iv) Applying OneHotEncoding to categorical variables.</p>
<fig position="float" id="fig1">
<label>Figure 1</label>
<caption><p>Initial distribution of quantitative variables.</p></caption>
<graphic xlink:href="fpsyg-16-1516417-g001.tif"/>
</fig>
<p>When the dataset was preprocessed, an oversampling process was performed on the unbalanced class in both recodings (Success) using the Imbalanced Learn library (<xref ref-type="bibr" rid="ref23">Lemaitre et al., 2017</xref>) which adjusted the classes to 50%. <xref ref-type="fig" rid="fig2">Figure 2</xref> presents the percentage of positive cases for the target variable, considering success as a goal (<xref ref-type="fig" rid="fig2">Figures 2A</xref>,<xref ref-type="fig" rid="fig2">B</xref>) and as both a goal and a shot (<xref ref-type="fig" rid="fig2">Figures 2C</xref>,<xref ref-type="fig" rid="fig2">D</xref>). The oversampling process was carried out using SMOTE, due to its performance in model training in other studies (<xref ref-type="bibr" rid="ref21">Last et al., 2017</xref>).</p>
<fig position="float" id="fig2">
<label>Figure 2</label>
<caption><p>Initial distribution of success and no success classes for the two recodings before and after oversampling. <bold>(A)</bold> Percentage of goals in the original dataset, <bold>(B)</bold> percentage of goals in the resampled dataset, <bold>(C)</bold> percentage of goals or shots in the original dataset, <bold>(D)</bold> percentage of goals or shots in the resampled dataset.</p></caption>
<graphic xlink:href="fpsyg-16-1516417-g002.tif"/>
</fig>
</sec>
<sec id="sec7">
<label>2.5</label>
<title>Data analysis</title>
<p>Once the datasets were resampled, the supervised machine learning models were trained using the Random Forest and XGBoost techniques, both implemented in the Scikit-Learn (<xref ref-type="bibr" rid="ref36">Pedregosa et al., 2011</xref>) and XGBoost (<xref ref-type="bibr" rid="ref10">Chen and Guestrin, 2016</xref>) libraries, respectively. The selection of these two algorithms is justified in this work to evaluate the classification capacity of different model combinations. In this context, the Random Forest model is considered one of the most powerful Bagging techniques, while XGBoost is classified within the Boosting techniques. The search for the best model was conducted through a cross-validation procedure using 5 folds on the training sample, which consisted of 80% of the total dataset. A grid search was performed using the following combination of hyperparameters:</p>
<list list-type="simple">
<list-item><p>- Random Forest Technique: (i) n_estimators (200, 300), (ii) max_depth (None, 10, 20, 30), (iii) min_samples_split (2, 5, 10), (iv) min_samples_leaf (1, 2, 4), and (v) Bootstrap (True, False)</p></list-item>
<list-item><p>- XGBoost: (i) n_estimators (200, 300), (ii) max_depth (3, 6, 9), (iii) learning_rate (0.01, 0.1, 0.2), (iv) subsample (0.6, 0.8, 1), and (v) colsample_bytree (0.6, 0.8, 1)</p></list-item>
</list>
<p>Once the best model was obtained, it was trained on the resampled dataset, and its performance was evaluated on both the resampled test set and the original test set. All the steps carried out are published in the following repository (<ext-link xlink:href="https://doi.org/10.6084/m9.figshare.27109405" ext-link-type="uri">https://doi.org/10.6084/m9.figshare.27109405</ext-link>) and the dataset is available at the following link (<ext-link xlink:href="https://doi.org/10.6084/m9.figshare.27109414" ext-link-type="uri">https://doi.org/10.6084/m9.figshare.27109414</ext-link>).</p>
</sec>
</sec>
<sec sec-type="results" id="sec8">
<label>3</label>
<title>Results</title>
<p>For both recoding 1 and recoding 2, the Random Forest algorithm demonstrated higher performance compared to the XGBoost algorithm. The combination of hyperparameters that provided the best performance for recoding 1 (Goal or Shot) was Random Forest: (i) n_estimators&#x202F;=&#x202F;200, (ii) max_depth&#x202F;=&#x202F;None, (iii) min_samples_split&#x202F;=&#x202F;5, (iv) min_samples_leaf&#x202F;=&#x202F;1, Bootstrap&#x202F;=&#x202F;False. Similarly, for recoding 2 (Goal), the best performance was achieved with the following Random Forest combination: (i) n_estimators&#x202F;=&#x202F;300, (ii) max_depth&#x202F;=&#x202F;None, (iii) min_samples_split&#x202F;=&#x202F;5, (iv) min_samples_leaf&#x202F;=&#x202F;1, Bootstrap&#x202F;=&#x202F;False.</p>
<sec id="sec9">
<label>3.1</label>
<title>Results of the classification models</title>
<p>The results of the classification models are presented in the form of a confusion matrix in <xref ref-type="fig" rid="fig3">Figure 3</xref>. Additionally, a summary of the main evaluation metrics is provided in <xref ref-type="table" rid="tab2">Table 2</xref>. Overall, the models demonstrated excellent performance on the resampled test sets (recall&#x202F;=&#x202F;0.93 and 0.98 for the first and second recoding, respectively). However, on the original test sets, the model was unable to generalize, showing a complete inability to predict the &#x201C;Goal&#x201D; outcome, with a recall of 0.</p>
<fig position="float" id="fig3">
<label>Figure 3</label>
<caption><p>Confusion matrix of the model on the resampled and original test set (recoding 1 and 2).</p></caption>
<graphic xlink:href="fpsyg-16-1516417-g003.tif"/>
</fig>
<table-wrap position="float" id="tab2">
<label>Table 2</label>
<caption><p>Summary report of the models trained.</p></caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th/>
<th align="center" valign="top" colspan="2">Goal or shot prediction</th>
<th align="center" valign="top" colspan="2">Goal prediction</th>
</tr>
<tr>
<th/>
<th align="center" valign="top">Resampled test set</th>
<th align="center" valign="top">Original test set</th>
<th align="center" valign="top">Resampled test set</th>
<th align="center" valign="top">Original test set</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top" colspan="5">Random Forest model</td>
</tr>
<tr>
<td align="left" valign="top">Accuracy</td>
<td align="center" valign="top">0.95</td>
<td align="center" valign="top">0.95</td>
<td align="center" valign="top">0.99</td>
<td align="center" valign="top">0.99</td>
</tr>
<tr>
<td align="left" valign="top">Recall</td>
<td align="center" valign="top">0.93</td>
<td align="center" valign="top">0.13</td>
<td align="center" valign="top">0.98</td>
<td align="center" valign="top">0</td>
</tr>
<tr>
<td align="left" valign="top">Specificity</td>
<td align="center" valign="top">0.97</td>
<td align="center" valign="top">0.98</td>
<td align="center" valign="top">0.99</td>
<td align="center" valign="top">1</td>
</tr>
<tr>
<td align="left" valign="top" colspan="5">XGBoost model</td>
</tr>
<tr>
<td align="left" valign="top">Accuracy</td>
<td align="center" valign="top">0.95</td>
<td align="center" valign="top">0.90</td>
<td align="center" valign="top">0.99</td>
<td align="center" valign="top">0.99</td>
</tr>
<tr>
<td align="left" valign="top">Recall</td>
<td align="center" valign="top">0.92</td>
<td align="center" valign="top">0.10</td>
<td align="center" valign="top">1</td>
<td align="center" valign="top">0</td>
</tr>
<tr>
<td align="left" valign="top">Specificity</td>
<td align="center" valign="top">0.97</td>
<td align="center" valign="top">0.97</td>
<td align="center" valign="top">0.98</td>
<td align="center" valign="top">1</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="sec10">
<label>3.2</label>
<title>Influence of predictor variables on the model output</title>
<p><xref ref-type="fig" rid="fig4">Figure 4</xref> shows the influence of predictor variables on the model output for recoding 1 (Success&#x202F;=&#x202F;Goal or Shot). It was observed that the variable with the greatest influence was the duration of the attack in the opponent&#x2019;s half, with higher values of this variable increasing the likelihood of a positive model output. Next, the variables with the most significant influence were the Possession Zone (dichotomous variables), confirming previous findings. Similarly, an initial offensive intention to progress increased the probability of a positive model output.</p>
<fig position="float" id="fig4">
<label>Figure 4</label>
<caption><p>Influence of predictor variables on the model output (Success&#x202F;=&#x202F;Shot or Goal). In the left figure, the overall influence of the predictor variables is presented. In the right figure, the influence is shown based on the value of the predictor variable: pink colors indicate high values for the predictor variable, and blue colors indicate low values. For example, in the case of the first variable (MO_seconds), the blue colors are located to the left of the X-axis (below 0), indicating that when the variable has low values (short possession duration in the opponent&#x2019;s half), the model decreases the likelihood of predicting the positive class (i.e., Goal or Shot). Lastly, for dichotomous variables (e.g., Offensive_intention_progress), the pink colors indicate the positive class of that variable (i.e., if there was an initial offensive intention to progress, then it is more likely that the model will predict the positive class for the target variable).</p></caption>
<graphic xlink:href="fpsyg-16-1516417-g004.tif"/>
</fig>
<p>For the variable Passes, the color distribution observed on the X-axis indicated that possessions with mid-range values (purple colors located towards the right of the X-axis) increased the likelihood of obtaining a positive output. Lastly, the starting lane of possessions also had an influence: while possessions that began in the central lane increased the probability of a positive model result, those that started on the left and right lanes had a negative influence.</p>
<p><xref ref-type="fig" rid="fig5">Figure 5</xref> presents the influence of each recorded feature on the model&#x2019;s output for 4 random cases from the original dataset, which allows us to gain an individual understanding of the influence of these variables on the specific actions analyzed.</p>
<fig position="float" id="fig5">
<label>Figure 5</label>
<caption><p>Influence of the features recorded in 4 random cases from the dataset on the model&#x2019;s output. Pink colors indicate an increase in the probability that the model&#x2019;s output will be the positive class of the target variable.</p></caption>
<graphic xlink:href="fpsyg-16-1516417-g005.tif"/>
</fig>
<p>Lastly, <xref ref-type="fig" rid="fig6">Figure 6</xref> presents the overall influence of the predictor variables on the model&#x2019;s output for recoding 2 (Success&#x202F;=&#x202F;Goal). In this model, the variable with the greatest influence was Match Outcome (Winner), followed by the variables Possession Zone (MO), Start Zone Width (Central), Possession Time in Opponent&#x2019;s Field, and Time (5Q). In this figure, an evident issue of collinearity between the target variable and the most influential variable in the model (Match Outcome&#x202F;=&#x202F;Winner) was observed, which may be the cause of the model&#x2019;s poor performance on the test set. Additionally, <xref ref-type="fig" rid="fig7">Figure 7</xref> presents the local influence of the recorded features in four specific cases from the analyzed dataset, aiming to show how the probabilities of success are modified based on the recorded variables.</p>
<fig position="float" id="fig6">
<label>Figure 6</label>
<caption><p>Influence of predictor variables on the model output (Success&#x202F;=&#x202F;Goal).</p></caption>
<graphic xlink:href="fpsyg-16-1516417-g006.tif"/>
</fig>
<fig position="float" id="fig7">
<label>Figure 7</label>
<caption><p>Influence of recorded features in 4 random cases from the dataset on the model&#x2019;s output.</p></caption>
<graphic xlink:href="fpsyg-16-1516417-g007.tif"/>
</fig>
</sec>
</sec>
<sec sec-type="discussion" id="sec11">
<label>4</label>
<title>Discussion</title>
<p>The objective of this study was, first, to create two binary classification models that could predict the outcome of ball possessions in elite women&#x2019;s football. Additionally, once the models were trained, the aim was to identify the technical-tactical indicators associated with a higher probability of achieving a goal or a shot during ball possessions. To achieve these objectives, a mapping of the Possession Outcome variable was performed based on the degree of success (Goal or Shot). Following this, oversampling of the minority class was conducted.</p>
<p>Previous studies have employed similar procedures with the aim of predicting the outcome of ball possessions in women&#x2019;s football. However, in most of these studies, success was defined as reaching the penalty area, reaching the final third, or, more generally, the creation of Goal Scoring Opportunities (<xref ref-type="bibr" rid="ref43">Scanlan et al., 2020</xref>; <xref ref-type="bibr" rid="ref19">Kubayi, 2022</xref>; <xref ref-type="bibr" rid="ref32">Mitrotasios et al., 2022</xref>; <xref ref-type="bibr" rid="ref31">Mesquita et al., 2023</xref>). This aspect is crucial when training a classification model, as approximately one in four (25%) ball possessions in women&#x2019;s football ends with a move into the final third or the opponent&#x2019;s penalty area (<xref ref-type="bibr" rid="ref15">Iv&#x00E1;n-Baraga&#x00F1;o et al., 2021</xref>; <xref ref-type="bibr" rid="ref9">Casal et al., 2023</xref>), allowing a balance between correctly classified positive and negative cases. In contrast, in this study, the dataset showed a percentage of positive cases of only 1.35% (Goal) and 8.28% (Goal or Shot), which necessitated oversampling of the minority classes to prevent the model from ignoring them (<xref ref-type="bibr" rid="ref13">Haller et al., 2023</xref>).</p>
<p>The classification models yielded excellent results on the resampled datasets, with recall and specificity exceeding 93% in both models. However, their performance on the original datasets was poor. When predicting shots or goals, the model had a recall of 13%, and in the case of goal prediction, the model did not predict any positive outcomes. These results highlight the difficulty of predicting infrequent events in football, such as shots and goals, and underscore the need for incorporating a larger number of predictor variables, as well as further tuning the hyperparameters during model training. Similarly, as seen in injury prediction, where different studies have shown recalls between 10 and 15% (<xref ref-type="bibr" rid="ref13">Haller et al., 2023</xref>; <xref ref-type="bibr" rid="ref27">Majumdar et al., 2024</xref>), the holistic nature of the sport contributes to the challenge of accurately predicting such events.</p>
<p>In relation to the SHAP technique (<xref ref-type="bibr" rid="ref26">Lundberg and Lee, 2017</xref>) applied in this study, it was found that a large number of indicators associated with ball possessions contributed to increasing the probability of a favorable outcome for the executing team. The performance indicators associated with successful ball possessions in elite women&#x2019;s football observed in this work largely align with previous studies on this topic. In this regard, <xref ref-type="bibr" rid="ref29">Maneiro et al. (2022)</xref> demonstrated that developing ball possessions in the opponent&#x2019;s half increased the likelihood of the possessions ending with a delivery into the penalty area. Similarly, the offensive tactical intent once ball possession was initiated, or the number of passes made in the offensive sequence, were variables that significantly altered the outcome of ball possessions in women&#x2019;s football (<xref ref-type="bibr" rid="ref43">Scanlan et al., 2020</xref>; <xref ref-type="bibr" rid="ref15">Iv&#x00E1;n-Baraga&#x00F1;o et al., 2021</xref>; <xref ref-type="bibr" rid="ref9">Casal et al., 2023</xref>).</p>
<p>However, considering that the level of success analyzed in this study was higher than in previous studies, this work also demonstrated the existence of variables that had not previously shown a multivariate influence on the outcome of ball possessions. For example, in the study by <xref ref-type="bibr" rid="ref16">Iv&#x00E1;n-Baraga&#x00F1;o et al. (2022)</xref>, it was observed that the current match score had an influence on the development and outcome of ball possessions. Thus, it is interesting to note that, while success in delivering the ball into the penalty area can be influenced by the flow of the game, when it comes to taking a shot or scoring a goal, this variable does not have sufficient influence. This insight may have significant implications for the sport, as it could suggest that when teams are losing, they tend to deliver the ball into the penalty area more often but are less successful in converting these deliveries into shots or goals.</p>
<p>Similarly, it is interesting to analyze the influence of the variables Time (5Q and 6Q) and Start Zone Width (Central). According to the SHAP values generated for these variables, the following insights can be drawn. When predicting a shot, the likelihood increases if the possession occurs in the last 15&#x202F;min of the match (6Q). However, when analyzing the SHAP values for the positive outcome &#x201C;Goal,&#x201D; the probability increases between the 60th and 75th minutes of the match. This contradicts the findings from the 1999, 2003, and 2007 World Cups, where a higher number of goals were observed in the final 15&#x202F;min of the match (<xref ref-type="bibr" rid="ref5">Armatas et al., 2007</xref>), as well as the results from the most recent Women&#x2019;s Euro 2022 (<xref ref-type="bibr" rid="ref42">Sanmiguel-Codina et al., 2025</xref>).</p>
<p>Additionally, the observation that starting an attack in the central lane (Start Zone Width&#x202F;=&#x202F;Central) increases the probability of success had not been noted in previous studies (<xref ref-type="bibr" rid="ref43">Scanlan et al., 2020</xref>; <xref ref-type="bibr" rid="ref15">Iv&#x00E1;n-Baraga&#x00F1;o et al., 2021</xref>; <xref ref-type="bibr" rid="ref29">Maneiro et al., 2022</xref>). This may suggest that while starting attacks from wide areas may facilitate successful entries into the penalty area, shots and goals are more likely to result from attacks initiated in central zones.</p>
<p>This study presents several limitations that should be addressed in future research. First, while the classification models achieved excellent performance on oversampled datasets using the SMOTE technique, their ability to detect true positives in the original dataset was notably poor. From a football perspective, this suggests that the actions leading to dangerous situations may follow highly specific patterns that generic classification models, such as Random Forest, are unable to effectively capture. In this context, future studies might benefit from the implementation of advanced statistical techniques like T-Patterns, which have proven effective in identifying offensive patterns and sequences in other sports (<xref ref-type="bibr" rid="ref37">Pic and Jonsson, 2021</xref>; <xref ref-type="bibr" rid="ref38">Pic et al., 2021</xref>). Additionally, exploring alternative tools to mitigate overfitting during model training is essential. Expanding the dataset by analyzing additional championships could also enhance the robustness of the identified patterns related to goal scoring. Furthermore, the inclusion of certain predictor variables, such as Match Outcome, was found to influence model performance, not due to their predictive capability, but because of their retrospective causal relationship (e.g., the winning team scored more goals). This introduces data leakage during model training. Consequently, future research should consider excluding such variables from the training process to ensure more reliable and generalizable results.</p>
</sec>
<sec sec-type="conclusions" id="sec12">
<label>5</label>
<title>Conclusion</title>
<p>The models trained and tested in this study showed excellent performance on the resampled datasets using the SMOTE technique (<xref ref-type="bibr" rid="ref21">Last et al., 2017</xref>). However, when these models were evaluated on the original dataset, their performance was low or non-existent. In the case of predicting Goals or Shots, the model achieved a recall of 13%, which slightly increased the relative frequency of the positive class but fell far short of an acceptable performance. For goal prediction, the model was unable to output the positive class at all. Based on this, it can be stated that such events in elite women&#x2019;s football possess very specific characteristics and patterns that cannot be clearly defined or that, at least, involve variables not analyzed in this study.</p>
<p>On the other hand, the SHAP explainability techniques applied in this study allowed for the identification of various variables associated with the achievement of goals and shots. Some of these variables showed similarities to previous studies, where success was categorized as entries into the penalty area or similar metrics. However, other variables such as start zone width, timing, or defensive intent had a significant influence on the model when analyzing a higher degree of success, enabling a tactical understanding of how these types of actions occur.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="sec13">
<title>Data availability statement</title>
<p>The datasets presented in this study can be found in online repositories. The names of the repository/repositories and accession number(s) can be found in the article/supplementary material.</p>
</sec>
<sec sec-type="author-contributions" id="sec14">
<title>Author contributions</title>
<p>II-B: Data curation, Investigation, Methodology, Software, Supervision, Visualization, Writing &#x2013; original draft, Writing &#x2013; review &#x0026; editing. AA: Formal analysis, Investigation, Supervision, Validation, Writing &#x2013; review &#x0026; editing. JL: Methodology, Writing &#x2013; review &#x0026; editing. RM: Conceptualization, Investigation, Supervision, Validation, Writing &#x2013; original draft, Writing &#x2013; review &#x0026; editing.</p>
</sec>
<sec sec-type="funding-information" id="sec15">
<title>Funding</title>
<p>The author(s) declare that no financial support was received for the research, authorship, and/or publication of this article.</p>
</sec>
<sec sec-type="COI-statement" id="sec16">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="ai-statement" id="sec17">
<title>Generative AI statement</title>
<p>The authors declare that no Gen AI was used in the creation of this manuscript.</p>
</sec>
<sec sec-type="disclaimer" id="sec18">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ref-list>
<title>References</title>
<ref id="ref1"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Almeida</surname> <given-names>C. H.</given-names></name> <name><surname>Ferreira</surname> <given-names>A. P.</given-names></name> <name><surname>Volossovitch</surname> <given-names>A.</given-names></name></person-group> (<year>2014</year>). <article-title>Effects of match location, match status and quality of opposition on regaining possession in UEFA champions league</article-title>. <source>J. Hum. Kinet.</source> <volume>41</volume>, <fpage>203</fpage>&#x2013;<lpage>214</lpage>. doi: <pub-id pub-id-type="doi">10.2478/hukin-2014-0048</pub-id>, PMID: <pub-id pub-id-type="pmid">25114747</pub-id></citation></ref>
<ref id="ref2"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>AlMulla</surname> <given-names>J.</given-names></name> <name><surname>Islam</surname> <given-names>M. T.</given-names></name> <name><surname>Al-Absi</surname> <given-names>H. R. H.</given-names></name> <name><surname>Alam</surname> <given-names>T.</given-names></name></person-group> (<year>2023</year>). <article-title>SoccerNet: a gated recurrent unit-based model to predict soccer match winners</article-title>. <source>PLoS One</source> <volume>18</volume>:<fpage>e0288933</fpage>. doi: <pub-id pub-id-type="doi">10.1371/journal.pone.0288933</pub-id>, PMID: <pub-id pub-id-type="pmid">37527260</pub-id></citation></ref>
<ref id="ref3"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Anguera</surname> <given-names>M. T.</given-names></name></person-group> (<year>1979</year>). <article-title>Observational typology</article-title>. <source>Qual. Quant.</source> <volume>13</volume>, <fpage>449</fpage>&#x2013;<lpage>484</lpage>.</citation></ref>
<ref id="ref4"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Anguera</surname> <given-names>M. T.</given-names></name> <name><surname>Blanco-Villase&#x00F1;or</surname> <given-names>A.</given-names></name> <name><surname>Hern&#x00E1;ndez-Mendo</surname> <given-names>A.</given-names></name> <name><surname>Losada</surname> <given-names>J. L.</given-names></name></person-group> (<year>2011</year>). <article-title>Dise&#x00F1;os Observacionales: Ajuste y Aplicaci&#x00F3;n en Psicolog&#x00ED;a del Deporte [Observational designs: adjust and applications in sport psychology]</article-title>. <source>Cuad. Psicol. Deporte.</source> <volume>11</volume>, <fpage>63</fpage>&#x2013;<lpage>76</lpage>.</citation></ref>
<ref id="ref5"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Armatas</surname> <given-names>V.</given-names></name> <name><surname>Yiannakos</surname> <given-names>A.</given-names></name> <name><surname>Galazoulas</surname> <given-names>C.</given-names></name> <name><surname>Hatzimanouil</surname> <given-names>D.</given-names></name></person-group> (<year>2007</year>). <article-title>Goal scoring patterns over the course of a match: analysis of Women&#x2019;s high standard soccer matches</article-title>. <source>Phys. Train.</source></citation></ref>
<ref id="ref6"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bradley</surname> <given-names>P. S.</given-names></name></person-group> (<year>2025a</year>). <article-title>&#x2018;Setting the benchmark&#x2019; part 3: Contextualising the match demands of specialised positions at the FIFA Women&#x2019;s world cup Australia and New Zealand 2023</article-title>. <source>Biol. Sport</source> <volume>42</volume>, <fpage>99</fpage>&#x2013;<lpage>111</lpage>. doi: <pub-id pub-id-type="doi">10.5114/biolsport.2025.139857</pub-id>, PMID: <pub-id pub-id-type="pmid">39758172</pub-id></citation></ref>
<ref id="ref7"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bradley</surname> <given-names>P. S.</given-names></name></person-group> (<year>2025b</year>). <article-title>&#x2018;Setting the benchmark&#x2019; part 4: Contextualising the match demands of teams at the FIFA Women&#x2019;s world cup Australia and New Zealand 2023</article-title>. <source>Biol. Sport</source> <volume>42</volume>, <fpage>57</fpage>&#x2013;<lpage>69</lpage>. doi: <pub-id pub-id-type="doi">10.5114/biolsport.2025.142638</pub-id>, PMID: <pub-id pub-id-type="pmid">39649281</pub-id></citation></ref>
<ref id="ref8"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Branquinho</surname> <given-names>L.</given-names></name> <name><surname>de Fran&#x00E7;a</surname> <given-names>E.</given-names></name> <name><surname>Teixeira</surname> <given-names>J. E.</given-names></name> <name><surname>Paiva</surname> <given-names>E.</given-names></name> <name><surname>Forte</surname> <given-names>P.</given-names></name> <name><surname>Thomatieli-Santos</surname> <given-names>R. V.</given-names></name> <etal/></person-group>. (<year>2024</year>). <article-title>Relationship between key offensive performance indicators and match running performance in the FIFA Women&#x2019;s world cup 2023</article-title>. <source>Int. J. Perform. Anal. Sport</source>, <fpage>1</fpage>&#x2013;<lpage>15</lpage>. doi: <pub-id pub-id-type="doi">10.1080/24748668.2024.2335460</pub-id></citation></ref>
<ref id="ref9"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Casal</surname> <given-names>C.</given-names></name> <name><surname>Stone</surname> <given-names>J.</given-names></name> <name><surname>Iv&#x00E1;n-Baraga&#x00F1;o</surname> <given-names>I.</given-names></name> <name><surname>Losada</surname> <given-names>J.</given-names></name></person-group> (<year>2023</year>). <article-title>Effect of goalkeepers&#x2019; offensive participation on team performance in the women Spanish La Liga: a multinomial logistic regression analysis</article-title>. <source>Biol. Sport</source> <volume>41</volume>, <fpage>29</fpage>&#x2013;<lpage>39</lpage>. doi: <pub-id pub-id-type="doi">10.5114/biolsport.2024.125592</pub-id>, PMID: <pub-id pub-id-type="pmid">38188123</pub-id></citation></ref>
<ref id="ref10"><citation citation-type="other"><person-group person-group-type="author"><name><surname>Chen</surname> <given-names>T.</given-names></name> <name><surname>Guestrin</surname> <given-names>C.</given-names></name></person-group> (<year>2016</year>). XGBoost: a scalable tree boosting system, in <italic>Proceedings of the ACM SIGKDD International Conference on Knowledge Discovery and Data Mining</italic> (Association for Computing Machinery), 785&#x2013;794. doi: <pub-id pub-id-type="doi">10.1145/2939672.2939785</pub-id></citation></ref>
<ref id="ref11"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Claudino</surname> <given-names>J. G.</given-names></name> <name><surname>Capanema</surname> <given-names>D. D. O.</given-names></name> <name><surname>De Souza</surname> <given-names>T. V.</given-names></name> <name><surname>Serr&#x00E3;o</surname> <given-names>J. C.</given-names></name> <name><surname>Machado Pereira</surname> <given-names>A. C.</given-names></name> <name><surname>Nassis</surname> <given-names>G. P.</given-names></name></person-group> (<year>2019</year>). <article-title>Current approaches to the use of artificial intelligence for injury risk assessment and performance prediction in team sports: a systematic review</article-title>. <source>Sports Med Open</source> <volume>5</volume>:<fpage>28</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s40798-019-0202-3</pub-id>, PMID: <pub-id pub-id-type="pmid">31270636</pub-id></citation></ref>
<ref id="ref12"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cohen</surname> <given-names>J.</given-names></name></person-group> (<year>1960</year>). <article-title>A coefficient of agreement for nominal scales</article-title>. <source>Educ. Psychol. Meas.</source> <volume>20</volume>, <fpage>37</fpage>&#x2013;<lpage>46</lpage>. doi: <pub-id pub-id-type="doi">10.1177/001316446002000104</pub-id></citation></ref>
<ref id="ref13"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Haller</surname> <given-names>N.</given-names></name> <name><surname>Kranzinger</surname> <given-names>S.</given-names></name> <name><surname>Kranzinger</surname> <given-names>C.</given-names></name> <name><surname>Blumkaitis</surname> <given-names>J. C.</given-names></name> <name><surname>Strepp</surname> <given-names>T.</given-names></name> <name><surname>Simon</surname> <given-names>P.</given-names></name> <etal/></person-group>. (<year>2023</year>). <article-title>Predicting injury and illness with machine learning in elite youth soccer: a comprehensive monitoring approach over 3 months</article-title>. <source>J. Sports Sci. Med.</source> <volume>22</volume>, <fpage>476</fpage>&#x2013;<lpage>487</lpage>. doi: <pub-id pub-id-type="doi">10.52082/jssm.2023.476</pub-id>, PMID: <pub-id pub-id-type="pmid">37711721</pub-id></citation></ref>
<ref id="ref14"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hughes</surname> <given-names>M. D.</given-names></name> <name><surname>Bartlett</surname> <given-names>R. M.</given-names></name></person-group> (<year>2002</year>). <article-title>The use of performance indicators in performance analysis</article-title>. <source>J. Sports Sci.</source> <volume>20</volume>, <fpage>739</fpage>&#x2013;<lpage>754</lpage>. doi: <pub-id pub-id-type="doi">10.1080/026404102320675602</pub-id></citation></ref>
<ref id="ref15"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Iv&#x00E1;n-Baraga&#x00F1;o</surname> <given-names>I.</given-names></name> <name><surname>Maneiro</surname> <given-names>R.</given-names></name> <name><surname>Losada</surname> <given-names>J. L.</given-names></name> <name><surname>Ard&#x00E1;</surname> <given-names>A.</given-names></name></person-group> (<year>2021</year>). <article-title>Multivariate analysis of the offensive phase in high-performance women&#x2019;s soccer: a mixed methods study</article-title>. <source>Sustain.</source> <volume>13</volume>. doi: <pub-id pub-id-type="doi">10.3390/su13116379</pub-id></citation></ref>
<ref id="ref16"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Iv&#x00E1;n-Baraga&#x00F1;o</surname> <given-names>I.</given-names></name> <name><surname>Maneiro</surname> <given-names>R.</given-names></name> <name><surname>Losada</surname> <given-names>J. L.</given-names></name> <name><surname>Ard&#x00E1;</surname> <given-names>A.</given-names></name></person-group> (<year>2022</year>). <article-title>Influence of match status in ball possessions in the FIFA Women&#x2019;s world cup France 2019</article-title>. <source>Proc. Inst. Mech. Eng. P J. Sport Eng. Technol.</source> <volume>175433712211336</volume>. doi: <pub-id pub-id-type="doi">10.1177/17543371221133624</pub-id>, PMID: <pub-id pub-id-type="pmid">39841202</pub-id></citation></ref>
<ref id="ref17"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Iv&#x00E1;n-Baraga&#x00F1;o</surname> <given-names>I.</given-names></name> <name><surname>Maneiro</surname> <given-names>R.</given-names></name> <name><surname>Losada</surname> <given-names>J.</given-names></name> <name><surname>Ard&#x00E1;</surname> <given-names>A.</given-names></name></person-group> (<year>2025</year>). <article-title>Technical-tactical evolution of women&#x2019;s football: a comparative analysis of ball possessions in the FIFA Women&#x2019;s world cup France 2019 and Australia &#x0026; New Zealand 2023</article-title>. <source>Biol. Sport</source> <volume>42</volume>, <fpage>11</fpage>&#x2013;<lpage>20</lpage>. doi: <pub-id pub-id-type="doi">10.5114/biolsport.2025.139077</pub-id>, PMID: <pub-id pub-id-type="pmid">39758169</pub-id></citation></ref>
<ref id="ref18"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kirkendall</surname> <given-names>D. T.</given-names></name></person-group> (<year>2007</year>). <article-title>Issues in training the female player</article-title>. <source>Br. J. Sports Med.</source> <volume>41</volume>, <fpage>i64</fpage>&#x2013;<lpage>i67</lpage>. doi: <pub-id pub-id-type="doi">10.1136/bjsm.2007.036970</pub-id>, PMID: <pub-id pub-id-type="pmid">17504787</pub-id></citation></ref>
<ref id="ref19"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kubayi</surname> <given-names>A.</given-names></name></person-group> (<year>2022</year>). <article-title>The creation of goal-scoring opportunities at the 2019 FIFA Women&#x2019;s World Cup</article-title>. <source>J. Hum. Kinet.</source> <volume>82</volume>, <fpage>165</fpage>&#x2013;<lpage>172</lpage>. doi: <pub-id pub-id-type="doi">10.2478/hukin-2022-0043</pub-id>, PMID: <pub-id pub-id-type="pmid">36196349</pub-id></citation></ref>
<ref id="ref20"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Landis</surname> <given-names>J. R.</given-names></name> <name><surname>Koch</surname> <given-names>G. G.</given-names></name></person-group> (<year>1977</year>). <article-title>The measurement of observer agreement for categorical data</article-title>. <source>Biometrics</source> <volume>33</volume>, <fpage>159</fpage>&#x2013;<lpage>174</lpage>. doi: <pub-id pub-id-type="doi">10.2307/2529310</pub-id></citation></ref>
<ref id="ref21"><citation citation-type="other"><person-group person-group-type="author"><name><surname>Last</surname> <given-names>F.</given-names></name> <name><surname>Douzas</surname> <given-names>G.</given-names></name> <name><surname>Bacao</surname> <given-names>F.</given-names></name></person-group> (<year>2017</year>). Oversampling for imbalanced learning based on K-means and SMOTE. <italic>arXiv:1711.00837</italic>. doi: <pub-id pub-id-type="doi">10.1016/j.ins.2018.06.056</pub-id></citation></ref>
<ref id="ref22"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lee</surname> <given-names>J.</given-names></name> <name><surname>Mills</surname> <given-names>S.</given-names></name></person-group> (<year>2021</year>). <article-title>Analysis of corner kicks at the FIFA Women&#x2019;s World Cup 2019 in relation to match status and team quality</article-title>. <source>Int. J. Perform. Anal. Sport</source> <volume>21</volume>, <fpage>679</fpage>&#x2013;<lpage>699</lpage>. doi: <pub-id pub-id-type="doi">10.1080/24748668.2021.1936408</pub-id></citation></ref>
<ref id="ref47"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Leite</surname> <given-names>W. S.</given-names></name></person-group> (<year>2013</year>). <article-title>Analysis of goals in soccer world cups and the determination of the critical phase of the game</article-title>. <source>Facta Univ.</source> <volume>11</volume>, <fpage>247</fpage>&#x2013;<lpage>253</lpage>.</citation></ref>
<ref id="ref23"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lemaitre</surname> <given-names>G.</given-names></name> <name><surname>Nogueira</surname> <given-names>F.</given-names></name> <name><surname>Aridas</surname> <given-names>C. K.</given-names></name></person-group> (<year>2017</year>). <article-title>Imbalanced-learn: a Python toolbox to tackle the curse of imbalanced datasets in machine learning</article-title>. <source>J. Mach. Learn. Res.</source> <volume>18</volume>, <fpage>1</fpage>&#x2013;<lpage>5</lpage>. doi: <pub-id pub-id-type="doi">10.48550/arXiv.1609.06570</pub-id></citation></ref>
<ref id="ref24"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Losada</surname> <given-names>J. L.</given-names></name> <name><surname>Manolov</surname> <given-names>R.</given-names></name></person-group> (<year>2015</year>). <article-title>The process of basic training, applied training, maintaining the performance of an observer</article-title>. <source>Qual. Quant.</source> <volume>49</volume>, <fpage>339</fpage>&#x2013;<lpage>347</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s11135-014-9989-7</pub-id></citation></ref>
<ref id="ref25"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Low</surname> <given-names>B.</given-names></name> <name><surname>Coutinho</surname> <given-names>D.</given-names></name> <name><surname>Gon&#x00E7;alves</surname> <given-names>B.</given-names></name> <name><surname>Rein</surname> <given-names>R.</given-names></name> <name><surname>Memmert</surname> <given-names>D.</given-names></name> <name><surname>Sampaio</surname> <given-names>J.</given-names></name></person-group> (<year>2020</year>). <article-title>A systematic review of collective tactical behaviours in football using positional data</article-title>. <source>Sports Med.</source> <volume>50</volume>, <fpage>343</fpage>&#x2013;<lpage>385</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s40279-019-01194-7</pub-id>, PMID: <pub-id pub-id-type="pmid">31571155</pub-id></citation></ref>
<ref id="ref26"><citation citation-type="other"><person-group person-group-type="author"><name><surname>Lundberg</surname> <given-names>S. M.</given-names></name> <name><surname>Lee</surname> <given-names>S. I.</given-names></name></person-group> (<year>2017</year>). A unified approach to interpreting model predictions, in <italic>31st Conference on Neural Information Processing Systems</italic>. doi: <pub-id pub-id-type="doi">10.48550/arXiv.1705.07874</pub-id></citation></ref>
<ref id="ref27"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Majumdar</surname> <given-names>A.</given-names></name> <name><surname>Bakirov</surname> <given-names>R.</given-names></name> <name><surname>Hodges</surname> <given-names>D.</given-names></name> <name><surname>McCullagh</surname> <given-names>S.</given-names></name> <name><surname>Rees</surname> <given-names>T.</given-names></name></person-group> (<year>2024</year>). <article-title>A multi-season machine learning approach to examine the training load and injury relationship in professional soccer</article-title>. <source>J. Sports Anal.</source> <volume>10</volume>, <fpage>47</fpage>&#x2013;<lpage>65</lpage>. doi: <pub-id pub-id-type="doi">10.3233/JSA-240718</pub-id></citation></ref>
<ref id="ref28"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Maneiro</surname> <given-names>R.</given-names></name> <name><surname>Casal</surname> <given-names>C. A.</given-names></name> <name><surname>Ard&#x00E1;</surname> <given-names>A.</given-names></name> <name><surname>Losada</surname> <given-names>J. L.</given-names></name></person-group> (<year>2019</year>). <article-title>Application of multivariant decision tree technique in high performance football: the female and male corner kick</article-title>. <source>PLoS One</source> <volume>14</volume>:<fpage>e0212549</fpage>. doi: <pub-id pub-id-type="doi">10.1371/journal.pone.0212549</pub-id>, PMID: <pub-id pub-id-type="pmid">30856199</pub-id></citation></ref>
<ref id="ref29"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Maneiro</surname> <given-names>R.</given-names></name> <name><surname>Iv&#x00E1;n-Baraga&#x00F1;o</surname> <given-names>I.</given-names></name> <name><surname>Losada</surname> <given-names>J. L.</given-names></name> <name><surname>Ard&#x00E1;</surname> <given-names>A.</given-names></name></person-group> (<year>2022</year>). <article-title>Deciphering the offensive process in women&#x2019;s elite football: a multivariate study</article-title>. <source>Scand. J. Med. Sci. Sports</source> <volume>32</volume>, <fpage>1650</fpage>&#x2013;<lpage>1659</lpage>. doi: <pub-id pub-id-type="doi">10.1111/sms.14206</pub-id>, PMID: <pub-id pub-id-type="pmid">35801395</pub-id></citation></ref>
<ref id="ref30"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mara</surname> <given-names>J. K.</given-names></name> <name><surname>Wheeler</surname> <given-names>K. W.</given-names></name> <name><surname>Lyons</surname> <given-names>K.</given-names></name></person-group> (<year>2012</year>). <article-title>Attacking strategies that lead to goal scoring opportunities in high level women&#x2019;s football</article-title>. <source>Int. J. Sports Sci. Coach.</source> <volume>7</volume>, <fpage>565</fpage>&#x2013;<lpage>577</lpage>. doi: <pub-id pub-id-type="doi">10.1260/1747-9541.7.3.565</pub-id></citation></ref>
<ref id="ref31"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mesquita</surname> <given-names>P.</given-names></name> <name><surname>Silva</surname> <given-names>B.</given-names></name> <name><surname>Alexandre</surname> <given-names>M.</given-names></name> <name><surname>Rodrigues</surname> <given-names>P.</given-names></name></person-group> (<year>2023</year>). <article-title>Analysis of goal-scoring in an elite European women&#x2019;s football teams</article-title>. <source>Sustainability Sport Manage. J.</source> <volume>1</volume>, <fpage>16</fpage>&#x2013;<lpage>24</lpage>. doi: <pub-id pub-id-type="doi">10.61486/UUGA2681</pub-id></citation></ref>
<ref id="ref32"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mitrotasios</surname> <given-names>M.</given-names></name> <name><surname>Gonz&#x00E1;lez-Rodenas</surname> <given-names>J.</given-names></name> <name><surname>Armatas</surname> <given-names>V.</given-names></name> <name><surname>Malav&#x00E9;s</surname> <given-names>R. A.</given-names></name></person-group> (<year>2022</year>). <article-title>Creating goal scoring opportunities in men and women UEFA Champions League soccer matches: tactical similarities and differences</article-title>. <source>Retos: Nuevas Tendencias en Educaci&#x00F3;n F&#x00ED;sica, Deporte y Recreaci&#x00F3;n</source> <volume>43</volume>, <fpage>154</fpage>&#x2013;<lpage>161</lpage>. doi: <pub-id pub-id-type="doi">10.47197/retos.v43i0.88203</pub-id></citation></ref>
<ref id="ref33"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Nassis</surname> <given-names>G.</given-names></name> <name><surname>Verhagen</surname> <given-names>E.</given-names></name> <name><surname>Brito</surname> <given-names>J.</given-names></name> <name><surname>Figueiredo</surname> <given-names>P.</given-names></name> <name><surname>Krustrup</surname> <given-names>P.</given-names></name></person-group> (<year>2023</year>). <article-title>A review of machine learning applications in soccer with an emphasis on injury risk</article-title>. <source>Biol. Sport</source> <volume>40</volume>, <fpage>233</fpage>&#x2013;<lpage>239</lpage>. doi: <pub-id pub-id-type="doi">10.5114/biolsport.2023.114283</pub-id>, PMID: <pub-id pub-id-type="pmid">36636180</pub-id></citation></ref>
<ref id="ref34"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Oliva-Lozano</surname> <given-names>J. M.</given-names></name> <name><surname>Yousefian</surname> <given-names>F.</given-names></name> <name><surname>Chmura</surname> <given-names>P.</given-names></name> <name><surname>Gabbett</surname> <given-names>T. J.</given-names></name> <name><surname>Cost</surname> <given-names>R.</given-names></name></person-group> (<year>2025</year>). <article-title>Analysis of FIFA 2023 Women&#x2019;s World Cup match performance according to match outcome and phase of the tournament</article-title>. <source>Biol. Sport</source> <volume>42</volume>, <fpage>71</fpage>&#x2013;<lpage>84</lpage>. doi: <pub-id pub-id-type="doi">10.5114/biolsport.2025.142643</pub-id>, PMID: <pub-id pub-id-type="pmid">39649281</pub-id></citation></ref>
<ref id="ref35"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pappalardo</surname> <given-names>L.</given-names></name> <name><surname>Rossi</surname> <given-names>A.</given-names></name> <name><surname>Natilli</surname> <given-names>M.</given-names></name> <name><surname>Cintia</surname> <given-names>P.</given-names></name></person-group> (<year>2021</year>). <article-title>Explaining the difference between men&#x2019;s and women&#x2019;s football</article-title>. <source>PLoS One</source> <volume>16</volume>:<fpage>e0255407</fpage>. doi: <pub-id pub-id-type="doi">10.1371/journal.pone.0255407</pub-id>, PMID: <pub-id pub-id-type="pmid">34347829</pub-id></citation></ref>
<ref id="ref36"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pedregosa</surname> <given-names>F.</given-names></name> <name><surname>Michel</surname> <given-names>V.</given-names></name> <name><surname>Grisel</surname> <given-names>O.</given-names></name> <name><surname>Blondel</surname> <given-names>M.</given-names></name> <name><surname>Prettenhofer</surname> <given-names>P.</given-names></name> <name><surname>Weiss</surname> <given-names>R.</given-names></name> <etal/></person-group>. (<year>2011</year>). <article-title>Scikit-learn: machine learning in Python</article-title>. <source>J. Mach. Learn. Res.</source> <volume>12</volume>, <fpage>2825</fpage>&#x2013;<lpage>2830</lpage>. <comment>Available at:</comment> <ext-link xlink:href="http://scikit-learn.sourceforge.net" ext-link-type="uri">http://scikit-learn.sourceforge.net</ext-link></citation></ref>
<ref id="ref37"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pic</surname> <given-names>M.</given-names></name> <name><surname>Jonsson</surname> <given-names>G. K.</given-names></name></person-group> (<year>2021</year>). <article-title>Professional boxing analysis with T-patterns</article-title>. <source>Physiol. Behav.</source> <volume>232</volume>:<fpage>113329</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.physbeh.2021.113329</pub-id>, PMID: <pub-id pub-id-type="pmid">33493543</pub-id></citation></ref>
<ref id="ref38"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pic</surname> <given-names>M.</given-names></name> <name><surname>Navarro-Adelantado</surname> <given-names>V.</given-names></name> <name><surname>Jonsson</surname> <given-names>G. K.</given-names></name></person-group> (<year>2021</year>). <article-title>Exploring playful asymmetries for gender-related decision-making through T-pattern analysis</article-title>. <source>Physiol. Behav.</source> <volume>236</volume>:<fpage>113421</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.physbeh.2021.113421</pub-id>, PMID: <pub-id pub-id-type="pmid">33848526</pub-id></citation></ref>
<ref id="ref39"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Preciado</surname> <given-names>M.</given-names></name> <name><surname>Anguera</surname> <given-names>M. T.</given-names></name> <name><surname>Olarte</surname> <given-names>M.</given-names></name> <name><surname>Lapresa</surname> <given-names>D.</given-names></name></person-group> (<year>2019</year>). <article-title>Observational studies in male elite football: a systematic mixed study review</article-title>. <source>Front. Psychol.</source> <volume>10</volume>:<fpage>2077</fpage>. doi: <pub-id pub-id-type="doi">10.3389/fpsyg.2019.02077</pub-id>, PMID: <pub-id pub-id-type="pmid">31681054</pub-id></citation></ref>
<ref id="ref40"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rico-Gonz&#x00E1;lez</surname> <given-names>M.</given-names></name> <name><surname>Pino-Ortega</surname> <given-names>J.</given-names></name> <name><surname>M&#x00E9;ndez</surname> <given-names>A.</given-names></name> <name><surname>Clemente</surname> <given-names>F.</given-names></name> <name><surname>Baca</surname> <given-names>A.</given-names></name></person-group> (<year>2023</year>). <article-title>Machine learning application in soccer: a systematic review</article-title>. <source>Biol. Sport</source> <volume>40</volume>, <fpage>249</fpage>&#x2013;<lpage>263</lpage>. doi: <pub-id pub-id-type="doi">10.5114/biolsport.2023.112970</pub-id>, PMID: <pub-id pub-id-type="pmid">36636183</pub-id></citation></ref>
<ref id="ref41"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Robles-Palaz&#x00F3;n</surname> <given-names>F. J.</given-names></name> <name><surname>L&#x00F3;pez-Valenciano</surname> <given-names>A.</given-names></name> <name><surname>De Ste Croix</surname> <given-names>M.</given-names></name> <name><surname>Oliver</surname> <given-names>J. L.</given-names></name> <name><surname>Garc&#x00ED;a-G&#x00F3;mez</surname> <given-names>A.</given-names></name> <name><surname>Sainz de Baranda</surname> <given-names>P.</given-names></name> <etal/></person-group>. (<year>2021</year>). <article-title>Epidemiology of injuries in male and female youth football players: a systematic review and meta-analysis</article-title>. <source>J. Sport Health Sci.</source> <volume>11</volume>, <fpage>681</fpage>&#x2013;<lpage>695</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.jshs.2021.10.002</pub-id>, PMID: <pub-id pub-id-type="pmid">34700052</pub-id></citation></ref>
<ref id="ref42"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sanmiguel-Codina</surname> <given-names>J.</given-names></name> <name><surname>Ballester-Lengua</surname> <given-names>R.</given-names></name> <name><surname>Casal</surname> <given-names>C.</given-names></name> <name><surname>Huertas-Olmedo</surname> <given-names>F.</given-names></name></person-group> (<year>2025</year>). <article-title>Analysis of goal scoring patterns in the UEFA Women&#x2019;s EURO 2022</article-title>. <source>Biol. Sport</source> <volume>42</volume>, <fpage>45</fpage>&#x2013;<lpage>56</lpage>. doi: <pub-id pub-id-type="doi">10.5114/biolsport.2025.142646</pub-id>, PMID: <pub-id pub-id-type="pmid">39649281</pub-id></citation></ref>
<ref id="ref43"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Scanlan</surname> <given-names>M.</given-names></name> <name><surname>Harms</surname> <given-names>C.</given-names></name> <name><surname>Cochrane Wilkie</surname> <given-names>J.</given-names></name> <name><surname>Ma&#x2019;ayah</surname> <given-names>F.</given-names></name></person-group> (<year>2020</year>). <article-title>The creation of goal scoring opportunities at the 2015 Women&#x2019;s World Cup</article-title>. <source>Int. J. Sports Sci. Coach.</source> <volume>15</volume>, <fpage>803</fpage>&#x2013;<lpage>808</lpage>. doi: <pub-id pub-id-type="doi">10.1177/1747954120942051</pub-id></citation></ref>
<ref id="ref44"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shen</surname> <given-names>L.</given-names></name> <name><surname>Tan</surname> <given-names>Z.</given-names></name> <name><surname>Li</surname> <given-names>Z.</given-names></name> <name><surname>Li</surname> <given-names>Q.</given-names></name> <name><surname>Jiang</surname> <given-names>G.</given-names></name></person-group> (<year>2024</year>). <article-title>Tactics analysis and evaluation of women football team based on convolutional neural network</article-title>. <source>Sci. Rep.</source> <volume>14</volume>:<fpage>255</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41598-023-50056-w</pub-id>, PMID: <pub-id pub-id-type="pmid">38168541</pub-id></citation></ref>
<ref id="ref45"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Soto-Fern&#x00E1;ndez</surname> <given-names>A.</given-names></name> <name><surname>Camerino</surname> <given-names>O.</given-names></name> <name><surname>Iglesias</surname> <given-names>X.</given-names></name> <name><surname>Anguera</surname> <given-names>M. T.</given-names></name> <name><surname>Casta&#x00F1;er</surname> <given-names>M.</given-names></name></person-group> (<year>2021</year>). <article-title>LINCE PLUS software for systematic observational studies in sports and health</article-title>. <source>Behav. Res. Methods</source> <volume>54</volume>, <fpage>1263</fpage>&#x2013;<lpage>1271</lpage>. doi: <pub-id pub-id-type="doi">10.3758/s13428-021-01642-1</pub-id>, PMID: <pub-id pub-id-type="pmid">34549384</pub-id></citation></ref>
<ref id="ref46"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Stival</surname> <given-names>L.</given-names></name> <name><surname>Pinto</surname> <given-names>A.</given-names></name> <name><surname>Andrade</surname> <given-names>F. D. S. P.</given-names></name> <name><surname>Santiago</surname> <given-names>P. R. P.</given-names></name> <name><surname>Biermann</surname> <given-names>H.</given-names></name> <etal/></person-group>. (<year>2023</year>). <article-title>Using machine learning pipeline to predict entry into the attack zone in football</article-title>. <source>PLoS One</source> <volume>18</volume>:<fpage>e0265372</fpage>. doi: <pub-id pub-id-type="doi">10.1371/journal.pone.0265372</pub-id>, PMID: <pub-id pub-id-type="pmid">36652409</pub-id></citation></ref>
<ref id="ref48"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>Z.</given-names></name> <name><surname>Veli&#x010D;kovi&#x0107;</surname> <given-names>P.</given-names></name> <name><surname>Hennes</surname> <given-names>D.</given-names></name> <name><surname>Toma&#x0161;ev</surname> <given-names>N.</given-names></name> <name><surname>Prince</surname> <given-names>L.</given-names></name> <name><surname>Kaisers</surname> <given-names>M.</given-names></name> <etal/></person-group>. (<year>2024</year>). <article-title>TacticAI: an AI assistant for football tactics</article-title>. <source>Nat. Commun.</source> <volume>15</volume>:<fpage>1906</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41467-024-45965-x</pub-id>, PMID: <pub-id pub-id-type="pmid">38503774</pub-id></citation></ref>
</ref-list>
</back>
</article>