<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Sports Act. Living</journal-id>
<journal-title>Frontiers in Sports and Active Living</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Sports Act. Living</abbrev-journal-title>
<issn pub-type="epub">2624-9367</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fspor.2025.1646146</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Sports and Active Living</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Gait stability prediction through synthetic time-series and vision-based data</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes"><name><surname>Cordeiro</surname><given-names>Mauricio C.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="corresp" rid="cor1">&#x002A;</xref><uri xlink:href="https://loop.frontiersin.org/people/3026502/overview"/><role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/><role content-type="https://credit.niso.org/contributor-roles/data-curation/"/><role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/><role content-type="https://credit.niso.org/contributor-roles/investigation/"/><role content-type="https://credit.niso.org/contributor-roles/methodology/"/><role content-type="https://credit.niso.org/contributor-roles/validation/"/><role content-type="https://credit.niso.org/contributor-roles/visualization/"/><role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/><role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/></contrib>
<contrib contrib-type="author"><name><surname>Cathain</surname><given-names>Ciaran O.</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/2010543/overview" />
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/><role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/><role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/></contrib>
<contrib contrib-type="author"><name><surname>Nascimento</surname><given-names>Vitor B.</given-names></name>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref><uri xlink:href="https://loop.frontiersin.org/people/1217818/overview" />
<role content-type="https://credit.niso.org/contributor-roles/resources/"/><role content-type="https://credit.niso.org/contributor-roles/software/"/><role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/><role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/></contrib>
<contrib contrib-type="author"><name><surname>Rodrigues</surname><given-names>Thiago B.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref><uri xlink:href="https://loop.frontiersin.org/people/3071899/overview" /><role content-type="https://credit.niso.org/contributor-roles/project-administration/"/><role content-type="https://credit.niso.org/contributor-roles/supervision/"/><role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/><role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/></contrib>
</contrib-group>
<aff id="aff1"><label><sup>1</sup></label><institution>Department of Engineering &#x0026; Informatics, Technological University of the Shannon</institution>, <addr-line>Athlone</addr-line>, <country>Ireland</country></aff>
<aff id="aff2"><label><sup>2</sup></label><institution>Department of Sport &#x0026; Health Sciences, Technological University of the Shannon</institution>, <addr-line>Athlone</addr-line>, <country>Ireland</country></aff>
<aff id="aff3"><label><sup>3</sup></label><institution>SHE Research Centre, Technological University of the Shannon</institution>, <addr-line>Athlone</addr-line>, <country>Ireland</country></aff>
<aff id="aff4"><label><sup>4</sup></label><institution>Department of Sport Science and Nutrition, Faculty of Science and Engineering, Maynooth University</institution>, <addr-line>Maynooth</addr-line>, <country>Ireland</country></aff>
<aff id="aff5"><label><sup>5</sup></label><institution>Department of Physical Education, Pontif&#x00ED;cia Universidade Cat&#x00F3;lica do Paran&#x00E1;</institution>, <addr-line>Curitiba</addr-line>, <country>Brazil</country></aff>
<author-notes>
<fn fn-type="edited-by"><p><bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1632683/overview">Guoxin Zhang</ext-link>, The Hong Kong Polytechnic University, Hong Kong SAR, China</p></fn>
<fn fn-type="edited-by"><p><bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1719164/overview">Fei Yan</ext-link>, Chongqing Three Gorges Central Hospital, China</p>
<p><ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3112151/overview">Zhongyou Li</ext-link>, Sichuan University, China</p>
<p><ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3130019/overview">Chenxi Yan</ext-link>, Beihang University, China</p></fn>
<corresp id="cor1"><label>&#x002A;</label><bold>Correspondence:</bold> Mauricio C. Cordeiro <email>mauricio.cordeiro@tus.ie</email></corresp>
</author-notes>
<pub-date pub-type="epub"><day>13</day><month>08</month><year>2025</year></pub-date>
<pub-date pub-type="collection"><year>2025</year></pub-date>
<volume>7</volume><elocation-id>1646146</elocation-id>
<history>
<date date-type="received"><day>12</day><month>06</month><year>2025</year></date>
<date date-type="accepted"><day>29</day><month>07</month><year>2025</year></date>
</history>
<permissions>
<copyright-statement>&#x00A9; 2025 Cordeiro, Cathain, Nascimento and Rodrigues.</copyright-statement>
<copyright-year>2025</copyright-year><copyright-holder>Cordeiro, Cathain, Nascimento and Rodrigues</copyright-holder><license license-type="open-access" xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="http://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<abstract><sec><title>Introduction</title>
<p>Gait stability assessment in older adults is challenged by limited data availability and measurement complexity, particularly among vulnerable populations and in limited resource settings. We address three research questions: (1) can synthetic data accurately replicate the statistical properties of gait parameters in older adults? (2) how effectively do synthetic data-trained models predict the Margin of Stability (MoS) when tested on real-world data? and (3) what specific biomechanical features contribute most significantly to the MoS predictions in older adults? To address these challenges, the present study proposes a novel approach to gait stability prediction by integrating computer vision with a data-centric synthetic data generation (SDG) approach using accessible, low-cost technology.</p>
</sec><sec><title>Methods</title>
<p>Using a public dataset from 14 healthy older adults (86.7&#x2009;&#x00B1;&#x2009;6.2 years), we implemented a constraint-based SDG methodology that preserved biomechanical relationships through SDG metadata configuration and rank correlation-based constraints. Gait analysis was performed through a smartphone (Motorola Moto G5 Play) and the open-source MediaPipe algorithm to extract body landmarks from frontal plane gait videos, making the approach suitable for resource-limited settings.</p>
</sec><sec><title>Results</title>
<p>Our approach achieved exceptional fidelity (97.09&#x0025; overall) and maintained biomechanical variable relationships. The model trained exclusively on synthetic data (TSTR) outperformed the model trained on real data (TRTR), with error reductions (RMSE decreased by 56.3&#x0025;, MAE by 58.2&#x0025;, and MSE by 80.9&#x0025;) and improved variance explanation (<italic>R</italic><sup>2</sup> increase of 31.2&#x0025;). SHAP analysis revealed that the synthetic data approach enhanced feature attribution alignment with established principles, particularly for step width, BMI, and fall history.</p>
</sec><sec><title>Discussion</title>
<p>Therefore, our results show that: (1) synthetic data accurately replicated gait parameters with high fidelity; (2) synthetic data-trained models outperformed real data-trained models in MoS prediction; and (3) step width, BMI, and fall history were the most significant predictors of MoS in older adults. These findings demonstrate the potential of synthetic biomechanical time series to overcome data scarcity, improve predictive modeling capabilities, and enhance clinical gait assessment through accessible, low-cost computer vision methods.</p>
</sec>
</abstract>
<kwd-group>
<kwd>synthetic data</kwd>
<kwd>gait stability</kwd>
<kwd>computer vision</kwd>
<kwd>SHAP values</kwd>
<kwd>MediaPipe pose estimation</kwd>
</kwd-group><contract-sponsor id="cn001">Technological University of the Shannon (TUS) President&#x2019;s Doctoral Scholarship 2021</contract-sponsor><counts>
<fig-count count="5"/>
<table-count count="9"/><equation-count count="24"/><ref-count count="59"/><page-count count="15"/><word-count count="0"/></counts><custom-meta-wrap><custom-meta><meta-name>section-at-acceptance</meta-name><meta-value>Biomechanics and Control of Human Movement</meta-value></custom-meta></custom-meta-wrap>
</article-meta>
</front>
<body><sec id="s1" sec-type="intro"><label>1</label><title>Introduction</title>
<p>Human walking is a method of locomotion involving the use of the two legs alternately to provide support and propulsion by at least one foot throughout the gait cycle (<xref ref-type="bibr" rid="B1">1</xref>). Consequently, gait is an individual trait in healthy subjects that can be used for personal identification (<xref ref-type="bibr" rid="B2">2</xref>). However, it changes with age (<xref ref-type="bibr" rid="B3">3</xref>, <xref ref-type="bibr" rid="B4">4</xref>) and can be transformed by emotions (<xref ref-type="bibr" rid="B5">5</xref>), exercise-related or cognitive fatigue (<xref ref-type="bibr" rid="B6">6</xref>), or environmental factors (<xref ref-type="bibr" rid="B7">7</xref>). Assessing gait stability is particularly important in older adults, where impairments in walking can affect both independence and quality of life. Gait stability, pragmatically defined as the ability to walk without falling despite perturbations (<xref ref-type="bibr" rid="B8">8</xref>), is essential for maintaining active living. Therefore, various methods have been developed to assess gait stability, given that neuromuscular conditions and physical impairments can compromise balance control and lead to increased fall risk (<xref ref-type="bibr" rid="B9">9</xref>).</p>
<p>The consequences of mobility loss are severe for older adults. By age 70, approximately one-third report mobility restrictions, increasing to the majority by age 80. These limitations are linked to age-related declines in muscle strength, oxygen consumption, and sensory function, which collectively impair balance control and increase the risk of instability and falls (<xref ref-type="bibr" rid="B10">10</xref>&#x2013;<xref ref-type="bibr" rid="B12">12</xref>). Early identification of gait abnormalities and effective quantification of stability in many clinical populations has gained significant interest as increased knowledge of balance deficits or compensatory strategies may aid rehabilitation and inform therapeutic interventions to improve quality of life and functional capacity (<xref ref-type="bibr" rid="B11">11</xref>).</p>
<p>As described in (<xref ref-type="bibr" rid="B13">13</xref>), gait stability assessment relies on biomechanical principles investigated at the center of mass (CoM), the weighted average of a body&#x0027;s mass. During walking, stability depends on two factors: (1) the position of the CoM relative to the base of support (BoS), which determines whether the body is within stable limits, and (2) CoM velocity, which creates momentum that must be controlled through corrective forces to maintain balance. The extrapolated center of mass (XCoM) extends the CoM concept by incorporating its velocity scaled by a person-specific constant, enabling stability predictions during motion. This stability analysis can be quantified using the margin of stability (MoS), defined as the signed distance between the XCoM and the BoS (<xref ref-type="bibr" rid="B13">13</xref>). This MoS serves as the prediction target for our machine-learning models.</p>
<p>However, gait-related assessment in older adults can face relevant challenges, including limited data availability, measurement complexity, and resource constraints due to a diverse set of problems, such as mobility constraints, cognitive impairments, variability in functional capacity, inconsistent adherence to assessment protocols, and the heterogeneity of age-related gait patterns (<xref ref-type="bibr" rid="B10">10</xref>&#x2013;<xref ref-type="bibr" rid="B12">12</xref>). The integration of synthetic data generation (SDG) techniques has emerged as a promising approach to improve the accuracy and robustness of gait pattern modeling (<xref ref-type="bibr" rid="B14">14</xref>, <xref ref-type="bibr" rid="B15">15</xref>). Researchers can address data scarcity, privacy concerns, and data quality challenges by generating synthetic data that replicates real-world statistical properties, enabling the training of more accurate machine learning models (<xref ref-type="bibr" rid="B16">16</xref>&#x2013;<xref ref-type="bibr" rid="B19">19</xref>). Traditional synthetic data approaches emphasize fidelity, ensuring that synthetic data statistically resembles real-world data through distribution matching. Nevertheless, this singular focus might be insufficient for biomechanical applications because synthetic data with specific quality deficiencies can reduce predictive performance and distort model selection processes, compromising research integrity (<xref ref-type="bibr" rid="B20">20</xref>&#x2013;<xref ref-type="bibr" rid="B24">24</xref>). Despite these challenges, there remains limited research on applying synthetic data generation to gait stability-related parameters, particularly those captured using computer vision-based methods. This research gap is significant given the SDGs&#x2019; potential benefits for augmenting gait datasets, improving model generalization across diverse populations and walking conditions, enabling more prediction-based stability assessment tools, and uncovering valuable information hidden within biomechanical data.</p>
<p>Based on the identified research gaps in applying SDG to gait stability, this study addresses three research questions: (1) Can synthetic data accurately replicate the statistical properties of gait parameters in older adults? (2) How effectively do synthetic data-trained models predict MoS when tested on real-world data? (3) What specific biomechanical features contribute most significantly to the MoS predictions in older adults? We hypothesise that synthetic data generated with biomechanical constraints will enhance machine learning model performance for MoS prediction in older adults beyond that achievable with real-world data alone.</p>
<p>We adopt a dual-evaluation approach, assessing both statistical resemblance and utility, which represents a necessary shift beyond conventional statistical metrics (such as Maximum Mean Discrepancy or Kullback-Leibler divergence) towards a comprehensive data-centric approach (<xref ref-type="bibr" rid="B20">20</xref>). In this context, data utility measures how effectively synthetic data enhances downstream applications when validated against real-world data, particularly regarding model generalization and predictive accuracy. This dual-metric evaluation framework ensures that synthetic data serves two important functions: (1) representing the statistical properties of original data, and (2) providing practical utility through comparative performance metrics when models trained on synthetic data are evaluated against real-world data (TSTR paradigm). By adopting a data-centric perspective, our SDG process aims to maintain biomechanical validity while addressing challenges in gait analysis, including limited sample sizes, inter-subject variability, and requirements for model generalization across the older adult population. Thereby, the synthesizer aims to generate sequential data (Centre of Mass position, CoM velocity, Margin of Stability) and static attributes (Age, Body Mass Index, Fall incidence history), with all synthetic samples undergoing comprehensive quality assessment to ensure biomechanical plausibility and effective dataset augmentation.</p>
<p>In summary, this paper assesses gait stability using metrics calculated from body landmark tracking via computer vision (<xref ref-type="bibr" rid="B25">25</xref>). We apply this approach to frontal plane video footage of healthy older adults (aged &#x003E;65 years) during self-paced walking, employing synthetic data generation to enhance model training. For prediction, we employ Extreme Gradient Boosting (XGBoost) (<xref ref-type="bibr" rid="B26">26</xref>), selected for its capability to handle biomechanical data with complex, non-linear relationships. Model interpretability is enhanced through Shapley Additive Explanations (SHAP) values, which elucidate the contribution of each feature to the MoS predictions (<xref ref-type="bibr" rid="B27">27</xref>).</p>
</sec>
<sec id="s2" sec-type="methods"><label>2</label><title>Methods</title>
<sec id="s2a"><label>2.1</label><title>Data source and participants</title>
<p>In data collection, we used a publicly available dataset (<xref ref-type="bibr" rid="B28">28</xref>) that was subsequently processed using the MediaPipe algorithm (see <xref ref-type="fig" rid="F1">Figure&#x00A0;1</xref>). The dataset comprised 14 healthy older adults residing in a retirement home (11 female, 3 male participants). The participants&#x2019; mean (&#x00B1;standard deviation) age, height, and mass were 86.7&#x2009;&#x00B1;&#x2009;6.2 years, 165.6&#x2009;&#x00B1;&#x2009;9.9&#x2005;cm, and 64.0&#x2009;&#x00B1;&#x2009;12.5&#x2005;kg, respectively. Each participant performed a standardized walking protocol, moving back and forth for one minute along a flat, 13&#x2005;m pathway within a large room.</p>
<fig id="F1" position="float"><label>Figure 1</label>
<caption><p>The flowchart of our methodology.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="fspor-07-1646146-g001.tif"><alt-text content-type="machine-generated">Flowchart of a video gait dataset analysis using the MediaPipe Pose algorithm. It calculates gait parameters like center of mass, velocity, and step width followed by signal processing techniques and data-centric synthetic data generation. Machine learning implementation involves XGBoost regressor with hyperparameter optimization, validated through quality assessment. Two-phase evaluation consists of real data training and synthetic data testing, with performance metrics and SHAP analysis.</alt-text>
</graphic>
</fig>
<p>The walking sessions were recorded using two Motorola Moto G5 Play cell phones (Motorola, Chicago, IL), each with a 13-megapixel rear camera capturing high-definition 1080p video at 30 frames per second. Frontal plane recordings (positioned at 111 centimeters height, designated as &#x201C;bottom&#x201D; in the file naming convention) were used for gait analysis.</p>
<p>Accompanying the frontal plane video recordings, the dataset included participant metadata with demographic information and clinical test scores. Based on that, we acknowledge that gait analysis commonly requires multi-view perspectives or 3D motion capture systems. However, we selected frontal plane analysis as it enables assessment of medio-lateral stability parameters relevant for this specific evaluation in older adults and aligns with our focus on low-cost computer vision methods in resource-constrained clinical settings.</p>
<p>Despite the limited sample size (<italic>n</italic>&#x2009;&#x003D;&#x2009;14), this dataset is suitable for our research because it provides standardized gait data from a homogeneous population of older adults collected using a smartphone camera in a controlled setting. This smartphone-based recording facilitates reliable biomechanical measurements whilst addressing realistic challenges of data scarcity and equipment limitations commonly encountered in clinical practice.</p>
<sec id="s2a1"><label>2.1.1</label><title>Computer vision and the MediaPipe pose approach</title>
<p>With the advancement of computer vision techniques, markerless gait analysis has become possible through video footage using pose estimation models such as BlazePose (<xref ref-type="bibr" rid="B29">29</xref>). These techniques involve using computer vision and machine learning (ML) algorithms to extract human poses and track the movement of the body&#x0027;s anatomical landmarks in 2D or 3D spaces over time.</p>
<p>MediaPipe Pose (MPP), an open-source, cross-platform framework provided by Google, captures 2D human joint coordinates in each image frame, consisting of three pre-trained detection models: EfficientDet-Lite0, EfficientDet-Lite2, and the Single Shot Detector (SSD) MobileNetV2 Model trained on the COCO image dataset (<xref ref-type="bibr" rid="B30">30</xref>). MPP uses BlazePose (<xref ref-type="bibr" rid="B29">29</xref>), a lightweight ML architecture that performs quickly on mobile phones and PCs with CPU inference, extracting thirty-three 2D landmarks on the human body, as shown in <xref ref-type="fig" rid="F2">Figure&#x00A0;2</xref>. Moreover, studies have demonstrated MediaPipe&#x0027;s feasibility against gold-standard motion capture systems for the measurement of angular variation for biomechanical evaluation (<xref ref-type="bibr" rid="B31">31</xref>), and for tracking gait parameters in the frontal plane with low mean absolute error (0.04&#x2013;0.18&#x2005;s) (<xref ref-type="bibr" rid="B32">32</xref>). <xref ref-type="fig" rid="F2">Figure&#x00A0;2</xref> illustrates the full set of MediaPipe Pose landmarks available for analysis. We used specific subsets of these landmarks for our gait stability calculations, as detailed in <xref ref-type="table" rid="T1">Table&#x00A0;1</xref>.</p>
<fig id="F2" position="float"><label>Figure 2</label>
<caption><p>Mediapipe pose landmarks (<xref ref-type="bibr" rid="B59">59</xref>).</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="fspor-07-1646146-g002.tif"><alt-text content-type="machine-generated">Diagram of a human figure with numbered points indicating key body parts for pose estimation. The points are connected with lines, and a list on the right describes each numbered point, such as the nose, eyes, mouth, shoulders, elbows, wrists, hips, knees, ankles, and specific fingers.</alt-text>
</graphic>
</fig>
<table-wrap id="T1" position="float"><label>Table 1</label>
<caption><p>Landmark coordinates required for kinematic measurements.</p></caption>
<table frame="hsides" rules="groups">
<colgroup>
<col align="left"/>
<col align="left"/>
<col align="left"/>
</colgroup>
<thead>
<tr>
<th valign="top" align="left">Calculation purpose</th>
<th valign="top" align="center">Landmarks used</th>
<th valign="top" align="center">Landmark numbers</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Center of Mass (CoM)</td>
<td valign="top" align="left">Nose, Left/Right eyes (inner &#x0026; outer), Shoulders, Hips, Elbows, Wrists, Knees, Ankles</td>
<td valign="top" align="left">0, 1, 2, 3, 4, 11, 12, 13, 14, 15, 16, 23, 24, 25, 26, 27, 28</td>
</tr>
<tr>
<td valign="top" align="left">Extrapolated Center of Mass (XCoM)</td>
<td valign="top" align="left">Left and Right Hips</td>
<td valign="top" align="left">23, 24</td>
</tr>
<tr>
<td valign="top" align="left">Step Width</td>
<td valign="top" align="left">Left and Right Ankles</td>
<td valign="top" align="left">27, 28</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>Several metrics were derived from the integration of MPP and the dataset itself, as outlined in <xref ref-type="table" rid="T2">Table&#x00A0;2</xref>. However, before that, to accurately calculate stability metrics such as the MoS, we included each participant&#x0027;s height and weight directly within the <italic>MediaPipe</italic> processing code for each video sequence, allowing the algorithm to generate stability metrics that account for individual anthropometric differences in COM displacement calculations across participants.</p>
<table-wrap id="T2" position="float"><label>Table 2</label>
<caption><p>Gait metrics and their origin and application.</p></caption>
<table frame="hsides" rules="groups">
<colgroup>
<col align="left"/>
<col align="left"/>
</colgroup>
<thead>
<tr>
<th valign="top" align="left">Metric</th>
<th valign="top" align="center">Origin and application</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">COM<xref ref-type="table-fn" rid="table-fn1"><sup>a</sup></xref></td>
<td valign="top" align="left">We calculated the COM for each frame based on key body landmarks. Segmental COM values were weighted according to their proportional contribution to the total body weight, and a combined COM was computed.</td>
</tr>
<tr>
<td valign="top" align="left">Velocity of COM</td>
<td valign="top" align="left">By analyzing the COM&#x0027;s movement between frames, we calculated the velocity based on the frame acquisition rate, a crucial input for stability-related measures.</td>
</tr>
<tr>
<td valign="top" align="left">XCoM<xref ref-type="table-fn" rid="table-fn1"><sup>a</sup></xref></td>
<td valign="top" align="left">We computed using COM velocity and position data to provide an adjusted measure of stability for each frame.</td>
</tr>
<tr>
<td valign="top" align="left">MoS<xref ref-type="table-fn" rid="table-fn1"><sup>a</sup></xref></td>
<td valign="top" align="left">We determined it by calculating the distance between XCoM and the base of support, formed by the left and right ankles, for each frame. This quantifies stability dynamically as the participant moves.</td>
</tr>
<tr>
<td valign="top" align="left">Step Width</td>
<td valign="top" align="left">By analyzing ankle positions, we calculated the step width for each frame, which provides information about gait stability and variability.</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn id="table-fn1"><label><sup>a</sup></label>
<p>COM, center of mass; XCoM, extrapolated center of mass; MoS, margin of stability.</p></fn>
</table-wrap-foot>
</table-wrap>
<p>As described in (<xref ref-type="bibr" rid="B13">13</xref>), one limitation in the estimation of MoS is the assumption of instantaneous adjustments in the center of pressure (CoP). CoP adjustments are constrained by the finite reaction time required for muscle activation. While this limitation has been explored in standing balance, it still needs to be investigated for walking dynamics. Although our <italic>Mediapipe&#x0027;s</italic> pose extraction works to capture gait dynamics, it has not fully addressed this previous limitation.</p>
<p>These are the formulas used to calculate these metrics. First, to calculate the COM for body segments, we used <xref ref-type="disp-formula" rid="disp-formula1">Equation&#x00A0;1</xref>:<disp-formula id="disp-formula1"><label>(1)</label><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="DM1"><mml:mtable rowspacing="4pt" columnspacing="1em"><mml:mtr><mml:mtd><mml:mrow><mml:mrow><mml:mi mathvariant="normal">CO</mml:mi></mml:mrow><mml:msub><mml:mrow><mml:mi mathvariant="normal">M</mml:mi></mml:mrow><mml:mrow><mml:mrow><mml:mi mathvariant="normal">segment</mml:mi></mml:mrow></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mfrac><mml:mn>1</mml:mn><mml:mi>n</mml:mi></mml:mfrac></mml:mrow><mml:munderover><mml:mrow><mml:mo movablelimits="false">&#x2211;</mml:mo></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover><mml:mspace width="0.2em"/><mml:msub><mml:mi>p</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mstyle></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>Where <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM1"><mml:msub><mml:mi>p</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:math></inline-formula> represented the position vector of the <italic>i</italic> -th landmark within the segment (with x and y coordinates from the 2D video plane), and <italic>n</italic> is the total number of landmarks in the segment. While MediaPipe provided estimated z-coordinates, our analysis used the frontal plane (x,y) coordinates for consistency with our 2D video capture methodology.</p>
<p>The COM for the entire body is then calculated as a weighted sum of each segment&#x0027;s COM using anthropometric segment weight coefficients that represent each body segment&#x0027;s proportional mass relative to total body weight (<xref ref-type="disp-formula" rid="disp-formula2">Equation&#x00A0;2</xref>). These coefficients were: head (8.1&#x0025;), torso (49.7&#x0025;), arms (2.65&#x0025; each), and legs (16.1&#x0025; each), based on established anthropometry (<xref ref-type="bibr" rid="B33">33</xref>).<disp-formula id="disp-formula2"><label>(2)</label><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="DM2"><mml:mtable rowspacing="4pt" columnspacing="1em"><mml:mtr><mml:mtd><mml:mrow><mml:mrow><mml:mi mathvariant="normal">CO</mml:mi></mml:mrow><mml:msub><mml:mrow><mml:mi mathvariant="normal">M</mml:mi></mml:mrow><mml:mrow><mml:mrow><mml:mi mathvariant="normal">body</mml:mi></mml:mrow></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mfrac><mml:mrow><mml:msubsup><mml:mrow><mml:mo movablelimits="false">&#x2211;</mml:mo></mml:mrow><mml:mrow><mml:mspace width=".1em"/><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:msubsup><mml:mspace width="0.2em"/><mml:msub><mml:mi>w</mml:mi><mml:mi>j</mml:mi></mml:msub><mml:mo>&#x22C5;</mml:mo><mml:mrow><mml:mi mathvariant="normal">CO</mml:mi></mml:mrow><mml:msub><mml:mrow><mml:mi mathvariant="normal">M</mml:mi></mml:mrow><mml:mi>j</mml:mi></mml:msub></mml:mrow><mml:mrow><mml:msubsup><mml:mrow><mml:mo movablelimits="false">&#x2211;</mml:mo></mml:mrow><mml:mrow><mml:mspace width=".1em"/><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>m</mml:mi></mml:msubsup><mml:mspace width="0.2em"/><mml:msub><mml:mi>w</mml:mi><mml:mi>j</mml:mi></mml:msub></mml:mrow></mml:mfrac></mml:mrow></mml:mstyle></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>Where <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM2"><mml:mrow><mml:mi mathvariant="normal">CO</mml:mi></mml:mrow><mml:msub><mml:mrow><mml:mi mathvariant="normal">M</mml:mi></mml:mrow><mml:mi>j</mml:mi></mml:msub></mml:math></inline-formula> is the COM of the <italic>j</italic> -th body segment, <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM3"><mml:mspace width="0.25em"/><mml:msub><mml:mi>w</mml:mi><mml:mi>j</mml:mi></mml:msub></mml:math></inline-formula> is the weight coefficient of that segment as a proportion of total body weight, and <italic>m</italic> is the total number of body segments considered.</p>
<p>The velocity of the CoM is derived from the difference between successive CoM positions over time (<xref ref-type="disp-formula" rid="disp-formula3">Equation&#x00A0;3</xref>):<disp-formula id="disp-formula3"><label>(3)</label><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="DM3"><mml:mtable rowspacing="4pt" columnspacing="1em"><mml:mtr><mml:mtd><mml:mrow><mml:msub><mml:mi>v</mml:mi><mml:mrow><mml:mrow><mml:mi mathvariant="normal">COM</mml:mi></mml:mrow></mml:mrow></mml:msub><mml:mo stretchy="false">(</mml:mo><mml:mi>t</mml:mi><mml:mo stretchy="false">)</mml:mo><mml:mo>=</mml:mo><mml:mi>f</mml:mi><mml:mo>&#x22C5;</mml:mo><mml:mo stretchy="false">[</mml:mo><mml:mrow><mml:mrow><mml:mi mathvariant="normal">CO</mml:mi></mml:mrow><mml:msub><mml:mrow><mml:mi mathvariant="normal">M</mml:mi></mml:mrow><mml:mrow><mml:mrow><mml:mi mathvariant="normal">body</mml:mi></mml:mrow></mml:mrow></mml:msub><mml:mo stretchy="false">(</mml:mo><mml:mi>t</mml:mi><mml:mo stretchy="false">)</mml:mo><mml:mo>&#x2212;</mml:mo><mml:mrow><mml:mi mathvariant="normal">CO</mml:mi></mml:mrow><mml:msub><mml:mrow><mml:mi mathvariant="normal">M</mml:mi></mml:mrow><mml:mrow><mml:mrow><mml:mi mathvariant="normal">body</mml:mi></mml:mrow></mml:mrow></mml:msub><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>t</mml:mi><mml:mo>&#x2212;</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo stretchy="false">]</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>Where <italic>f</italic> is the sampling frequency in frames per second and <italic>t</italic> represents the frame index.</p>
<p>Additionally, the XCoM is calculated as an extrapolation of the CoM based on its velocity, helping to determine stability (<xref ref-type="disp-formula" rid="disp-formula4">Equation&#x00A0;4</xref>):<disp-formula id="disp-formula4"><label>(4)</label><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="DM4"><mml:mtable rowspacing="4pt" columnspacing="1em"><mml:mtr><mml:mtd><mml:mrow><mml:mrow><mml:mi mathvariant="normal">XCoM</mml:mi></mml:mrow><mml:mo>=</mml:mo><mml:mrow><mml:mi mathvariant="normal">CO</mml:mi></mml:mrow><mml:msub><mml:mrow><mml:mi mathvariant="normal">M</mml:mi></mml:mrow><mml:mrow><mml:mrow><mml:mi mathvariant="normal">body</mml:mi></mml:mrow></mml:mrow></mml:msub><mml:mo>+</mml:mo><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mfrac><mml:mrow><mml:msub><mml:mi>v</mml:mi><mml:mrow><mml:mrow><mml:mi mathvariant="normal">COM</mml:mi></mml:mrow></mml:mrow></mml:msub></mml:mrow><mml:mrow><mml:msub><mml:mi>&#x03C9;</mml:mi><mml:mn>0</mml:mn></mml:msub></mml:mrow></mml:mfrac></mml:mrow></mml:mstyle></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>Where <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM4"><mml:msub><mml:mi>&#x03C9;</mml:mi><mml:mn>0</mml:mn></mml:msub><mml:mo>=</mml:mo><mml:msqrt><mml:mrow><mml:mfrac><mml:mi>g</mml:mi><mml:mi>l</mml:mi></mml:mfrac></mml:mrow></mml:msqrt></mml:math></inline-formula> is the eigenfrequency of the inverted pendulum, with <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM5"><mml:mi>g</mml:mi><mml:mo>=</mml:mo><mml:mn>9.81</mml:mn><mml:mrow><mml:mspace width="0.25em"/><mml:mi mathvariant="normal">m</mml:mi><mml:mo>/</mml:mo></mml:mrow><mml:msup><mml:mrow><mml:mi mathvariant="normal">s</mml:mi></mml:mrow><mml:mn>2</mml:mn></mml:msup></mml:math></inline-formula> as gravitational acceleration and <italic>l</italic> l as the leg length. In our implementation, the leg length is computed as a fraction of the distance between the CoM and the midpoint of the ankles.</p>
<p>Moreover, we measured the MoS by evaluating the distances of the XCoM and CoM from the edge of the support base formed by the feet (<xref ref-type="disp-formula" rid="disp-formula5">Equation&#x00A0;5</xref>):<disp-formula id="disp-formula5"><label>(5)</label><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="DM5"><mml:mtable rowspacing="4pt" columnspacing="1em"><mml:mtr><mml:mtd><mml:mrow><mml:mrow><mml:mi mathvariant="normal">MoS</mml:mi></mml:mrow><mml:mo>=</mml:mo><mml:mo movablelimits="true" form="prefix">min</mml:mo><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:msub><mml:mi>d</mml:mi><mml:mrow><mml:mrow><mml:mi mathvariant="normal">XCoM</mml:mi></mml:mrow></mml:mrow></mml:msub><mml:mo>,</mml:mo><mml:msub><mml:mi>d</mml:mi><mml:mrow><mml:mrow><mml:mi mathvariant="normal">COM</mml:mi></mml:mrow></mml:mrow></mml:msub></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>Where <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM6"><mml:msub><mml:mi>d</mml:mi><mml:mrow><mml:mrow><mml:mi mathvariant="normal">XCoM</mml:mi></mml:mrow></mml:mrow></mml:msub></mml:math></inline-formula> and <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM7"><mml:msub><mml:mi>d</mml:mi><mml:mrow><mml:mrow><mml:mi mathvariant="normal">COM</mml:mi></mml:mrow></mml:mrow></mml:msub></mml:math></inline-formula> represent the perpendicular distances from XCoM and CoM to the boundary of the base of support, calculated using <xref ref-type="disp-formula" rid="disp-formula6">Equations&#x00A0;6</xref>, <xref ref-type="disp-formula" rid="disp-formula7">7</xref>:<disp-formula id="disp-formula6"><label>(6)</label><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="DM6"><mml:mtable rowspacing="4pt" columnspacing="1em"><mml:mtr><mml:mtd><mml:mrow><mml:msub><mml:mi>d</mml:mi><mml:mrow><mml:mrow><mml:mi mathvariant="normal">XCoM</mml:mi></mml:mrow></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mfrac><mml:mrow><mml:mo fence="false" stretchy="false">&#x2016;</mml:mo><mml:mrow><mml:msub><mml:mi>v</mml:mi><mml:mrow><mml:mrow><mml:mi mathvariant="normal">XCoM</mml:mi></mml:mrow></mml:mrow></mml:msub><mml:mo>&#x00D7;</mml:mo><mml:msub><mml:mi>v</mml:mi><mml:mrow><mml:mrow><mml:mi mathvariant="normal">boundary</mml:mi></mml:mrow></mml:mrow></mml:msub></mml:mrow><mml:mo fence="false" stretchy="false">&#x2016;</mml:mo></mml:mrow><mml:mrow><mml:mo fence="false" stretchy="false">&#x2016;</mml:mo><mml:mrow><mml:msub><mml:mi>v</mml:mi><mml:mrow><mml:mrow><mml:mi mathvariant="normal">boundary</mml:mi></mml:mrow></mml:mrow></mml:msub></mml:mrow><mml:mo fence="false" stretchy="false">&#x2016;</mml:mo></mml:mrow></mml:mfrac></mml:mrow></mml:mstyle></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula><disp-formula id="disp-formula7"><label>(7)</label><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="DM7"><mml:mtable rowspacing="4pt" columnspacing="1em"><mml:mtr><mml:mtd><mml:mrow><mml:msub><mml:mi>d</mml:mi><mml:mrow><mml:mrow><mml:mi mathvariant="normal">COM</mml:mi></mml:mrow></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mfrac><mml:mrow><mml:mo fence="false" stretchy="false">&#x2016;</mml:mo><mml:mrow><mml:msub><mml:mi>v</mml:mi><mml:mrow><mml:mrow><mml:mi mathvariant="normal">COM</mml:mi></mml:mrow></mml:mrow></mml:msub><mml:mo>&#x00D7;</mml:mo><mml:msub><mml:mi>v</mml:mi><mml:mrow><mml:mrow><mml:mi mathvariant="normal">boundary</mml:mi></mml:mrow></mml:mrow></mml:msub></mml:mrow><mml:mo fence="false" stretchy="false">&#x2016;</mml:mo></mml:mrow><mml:mrow><mml:mo fence="false" stretchy="false">&#x2016;</mml:mo><mml:mrow><mml:msub><mml:mi>v</mml:mi><mml:mrow><mml:mrow><mml:mi mathvariant="normal">boundary</mml:mi></mml:mrow></mml:mrow></mml:msub></mml:mrow><mml:mo fence="false" stretchy="false">&#x2016;</mml:mo></mml:mrow></mml:mfrac></mml:mrow></mml:mstyle></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>Finally, the step width between the left and right ankles is computed (<xref ref-type="disp-formula" rid="disp-formula8">Equation&#x00A0;8</xref>):<disp-formula id="disp-formula8"><label>(8)</label><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="DM8"><mml:mtable rowspacing="4pt" columnspacing="1em"><mml:mtr><mml:mtd><mml:mrow><mml:mrow><mml:mi mathvariant="normal">StepWidth</mml:mi></mml:mrow><mml:mo>=</mml:mo><mml:mo fence="false" stretchy="false">&#x2016;</mml:mo><mml:mrow><mml:msub><mml:mi>r</mml:mi><mml:mrow><mml:mrow><mml:mi mathvariant="normal">lef</mml:mi></mml:mrow><mml:msub><mml:mrow><mml:mi mathvariant="normal">t</mml:mi></mml:mrow><mml:mrow><mml:mi>x</mml:mi><mml:mi>y</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msub><mml:mo>&#x2212;</mml:mo><mml:msub><mml:mi>r</mml:mi><mml:mrow><mml:mrow><mml:mi mathvariant="normal">righ</mml:mi></mml:mrow><mml:msub><mml:mrow><mml:mi mathvariant="normal">t</mml:mi></mml:mrow><mml:mrow><mml:mi>x</mml:mi><mml:mi>y</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msub></mml:mrow><mml:mo fence="false" stretchy="false">&#x2016;</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>Where <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM8"><mml:msub><mml:mi>r</mml:mi><mml:mrow><mml:mrow><mml:mi mathvariant="normal">lef</mml:mi></mml:mrow><mml:msub><mml:mrow><mml:mi mathvariant="normal">t</mml:mi></mml:mrow><mml:mrow><mml:mi>x</mml:mi><mml:mi>y</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msub></mml:math></inline-formula> and <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM9"><mml:msub><mml:mi>r</mml:mi><mml:mrow><mml:mrow><mml:mi mathvariant="normal">righ</mml:mi></mml:mrow><mml:msub><mml:mrow><mml:mi mathvariant="normal">t</mml:mi></mml:mrow><mml:mrow><mml:mi>x</mml:mi><mml:mi>y</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msub></mml:math></inline-formula> represent the left and right ankle joint centers&#x2019; two-dimensional projections onto the frontal (xy) plane. Based on these tools, integrating datasets with MediaPipe&#x0027;s data extraction capabilities enabled us to capture metrics across the individuals&#x2019; walking sequences.</p>
</sec>
</sec>
<sec id="s2b"><label>2.2</label><title>Data preprocessing</title>
<p>Data preprocessing is the subsequent step to ensure the quality and reliability of the analysis. This was conducted using Python&#x0027;s Pandas (version 2.2) (<xref ref-type="bibr" rid="B34">34</xref>) and Scipy (version 1.13.1) (<xref ref-type="bibr" rid="B35">35</xref>) libraries following a structured sequence of operations as detailed below.</p>
<p>To reduce the noise and variability in the raw data, a fourth-order Butterworth low-pass filter was applied (<xref ref-type="bibr" rid="B36">36</xref>). The filter&#x0027;s cutoff frequency was set to 4&#x2005;Hz, commonly used in gait analysis to retain relevant gait dynamics while attenuating high-frequency noise (<xref ref-type="bibr" rid="B36">36</xref>). This filtering step smoothed the data and aimed to improve the accuracy of subsequent calculations.</p>
<p>We applied this filter independently to each landmark&#x0027;s x and y coordinates, ensuring zero-phase distortion and minimal signal delay. After filtering, the gait parameters (CoM, Step Width, MoS) were recalculated using the filtered landmark positions. This ensured that all subsequent analysis was based on refined trajectory data.</p>
<p>During video processing, the pose estimation algorithm can occasionally lose track of participants, particularly during rapid movements. These occasions result in missing data points for specific frames. To address this challenge, a mean imputation technique was employed using information from the previous and subsequent frames within the same walking sequence, maintaining the continuity of the movement trajectory. Also, we ensured that the data collection did not provide a number of missing values extremely high, i.e., greater than 20&#x0025; of the total number of frames in one gait cycle, as suggested by (<xref ref-type="bibr" rid="B37">37</xref>).</p>
<p>We detected and removed outliers to maintain the integrity of the dataset. We implemented a statistical approach based on each variable&#x0027;s mean and standard deviation. First, the mean (&#x03BC;) and standard deviation (&#x03C3;) were calculated for each sequential parameter. A data point was classified as an outlier if it fell outside the interval &#x03BC;&#x2009;&#x00B1;&#x2009;k&#x00B7;&#x03C3;, where k is a threshold factor. We selected k&#x2009;&#x003D;&#x2009;2 for our analysis, identifying values more than two standard deviations from the mean as outliers. This approach is a standard data preprocessing technique widely used in signal processing and anomaly detection (<xref ref-type="bibr" rid="B38">38</xref>). The two-standard-deviation threshold retains approximately 95&#x0025; of the data, preserving the majority of valid observations and eliminating extreme values that could distort subsequent analyses.</p>
<p>The final preprocessing step involved normalizing the input variables introduced into the machine learning model on the TRTR (Training on real data, testing on real data) process. On TSTR (Training on synthetic data, testing on real data), we had one more of the same normalization approach after the SDG implementation, focusing on applying the normalized data to the Machine Learning (ML) model. Thereby, we applied <italic>Min</italic>&#x2013;<italic>Max</italic> scaling, transforming each feature to a range between 0 and 1. This normalization ensures that features with different units and ranges contribute equally to the model without bias toward variables with larger numerical scales (<xref ref-type="bibr" rid="B39">39</xref>).</p>
</sec>
<sec id="s2c"><label>2.3</label><title>Synthetic data generation (SDG)</title>
<p>This research employed a data-centric approach to SDG for biomechanically-based time series data. The methodology centered on preserving specific biomechanical relationships while generating statistically representative synthetic samples. We employed YData&#x0027;s TimeSeriesSynthesizer [v2.0.0, <italic>ydata-sdk Python</italic> package (<xref ref-type="bibr" rid="B40">40</xref>)] to generate biomechanically constrained synthetic time-series data, configured via hierarchical metadata and correlation-preserving constraints (<xref ref-type="table" rid="T3">Table&#x00A0;3</xref>).</p>
<table-wrap id="T3" position="float"><label>Table 3</label>
<caption><p>Metadata configuration for biomechanical-based time series data.</p></caption>
<table frame="hsides" rules="groups">
<colgroup>
<col align="left"/>
<col align="left"/>
<col align="left"/>
</colgroup>
<thead>
<tr>
<th valign="top" align="left">Metadata component</th>
<th valign="top" align="center">Information provided to synthesizer</th>
<th valign="top" align="center">Utilization in synthesis process</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Temporal structure</td>
<td valign="top" align="left">The sequential organization of biomechanical parameters across time points (Timestamp range: 0.0&#x2013;7.2594)</td>
<td valign="top" align="left">Time-series architectures that preserve autocorrelation structure and temporal contingencies</td>
</tr>
<tr>
<td valign="top" align="left">Feature correlations</td>
<td valign="top" align="left">Multivariate relationship matrix (e.g., Step Width-MoS correlation: 0.768)</td>
<td valign="top" align="left">Multivariate sampling with covariance preservation; rank correlation-based approaches for maintaining interdependencies</td>
</tr>
<tr>
<td valign="top" align="left">Distributional parameters</td>
<td valign="top" align="left">Statistical moments of features, including skewness values</td>
<td valign="top" align="left">Normalizing flows; transformation functions that accurately model tail behaviors and central tendencies</td>
</tr>
<tr>
<td valign="top" align="left">Categorical frequencies</td>
<td valign="top" align="left">Cardinality and class distributions (14 unique participant IDs)</td>
<td valign="top" align="left">Stratified generation processes; conditional sampling with proper class balancing mechanisms</td>
</tr>
<tr>
<td valign="top" align="left">Variables boundaries</td>
<td valign="top" align="left">Domain constraints for biomechanical variables (e.g., Step Width: 0.002&#x2013;0.266&#x2005;m)</td>
<td valign="top" align="left">Constrained optimization; bounded generative functions with domain-appropriate activation mechanisms</td>
</tr>
<tr>
<td valign="top" align="left">Rank correlation-based biomechanical constraint</td>
<td valign="top" align="left">Rank-based correlation thresholds (Step Width-MoS: <italic>&#x03C1;</italic>&#x2009;&#x003E;&#x2009;0.7, Velocity-MoS: <italic>&#x03C1;</italic>&#x2009;&#x003C;&#x2009;&#x2212;0.3) derived from empirical biomechanical relationships</td>
<td valign="top" align="left">Distribution-invariant enforcement of biomechanical principles through rank correlation validation; preservation of stability-support relationships whilst accommodating individual variability</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>In the generation process, we incorporated a hierarchical architecture that respected temporal dependencies (stride-to-stride transitions) and entity-specific patterns (participant-level characteristics). Timestamp values were designated as the sequential sorting key, whilst participant identifiers were established as entity boundaries, enabling the synthesizer to capture both within-subject variability and between-subject differences in gait parameters.</p>
<p>We integrated domain-specific biomechanical constraints derived from established principles of locomotor stability. These constraints were designed to maintain relationships between gait parameters, particularly the positive correlation between step width and margin of stability (reflecting increased base of support) (<xref ref-type="bibr" rid="B41">41</xref>) and the inverse relationship between the center of mass velocity and margin of stability (reflecting reduced control at higher speeds) (<xref ref-type="bibr" rid="B42">42</xref>, <xref ref-type="bibr" rid="B43">43</xref>).</p>
<sec id="s2c1"><label>2.3.1</label><title>SDG technique</title>
<p>We used the TimeSeriesSynthesizer framework and implemented additional rank correlation-based dependency constraints to enforce biomechanical relationships in the generated data. The model architecture incorporated the following key components.</p>
<sec id="s2c1a"><label>2.3.1.1</label><title>Metadata configuration</title>
<p>The synthesizer was initialized with time series metadata specifying Timestamp as the temporal sorting key and ID as the entity identifier. This configuration established appropriate boundaries for learning temporal dynamics whilst preserving participant-specific characteristics.</p>
</sec>
<sec id="s2c1b"><label>2.3.1.2</label><title>Rank correlation-based constraint implementation</title>
<p>We developed custom constraint functions that evaluated relationships between biomechanical variables through rank statistics. Specifically, we utilized Spearman rank correlations to enforce relationships between key biomechanical parameters whilst maintaining their individual distributional properties. This approach enabled us to:
<list list-type="simple">
<list-item><label>(1)</label>
<p>Enforce a positive correlation between step width and margin of stability (<italic>&#x03C1;</italic>&#x2009;&#x003E;&#x2009;0.7, reflecting the observed value of 0.768 in the real data correlation matrix).</p></list-item>
<list-item><label>(2)</label>
<p>Maintain the inverse relationship between the center of mass velocity and margin of stability (<italic>&#x03C1;</italic>&#x2009;&#x003C;&#x2009;&#x2212;0.3, capturing the observed value of &#x2212;0.487 in the real data correlation matrix).</p></list-item>
</list>These correlation thresholds were implemented via custom validation functions that verified whether generated data maintained the specified biomechanical relationships. The functions calculated Spearman rank correlations between the relevant variables and validated that they met the predetermined thresholds derived from established biomechanical principles.</p>
</sec>
<sec id="s2c1c"><label>2.3.1.3</label><title>Variables boundary preservation</title>
<p>The synthesizer maintained the derived domains for biomechanical variables, including each variable&#x0027;s minimum and maximum values, such as step width (0.002&#x2013;0.266&#x2005;m) and margin of stability (0.004&#x2013;0.054&#x2005;m).</p>
</sec>
<sec id="s2c1d"><label>2.3.1.4</label><title>Model training and data generation</title>
<p>Finally, we trained the synthesizer using 1,878 timesteps of original data from 14 participants. This constrained model subsequently generated the synthetic dataset with equivalent dimensionality, preserving distributional characteristics and variable relationships.</p>
</sec>
</sec>
</sec>
<sec id="s2d"><label>2.4</label><title>SDG quality process and its assessment</title>
<p>To evaluate the quality of the synthetic data, we implemented an assessment framework addressing data fidelity and utility. This process comprised two components: (1) synthetic data fidelity evaluation and (2) predictive performance assessment through a supervised machine learning model.</p>
<sec id="s2d1"><label>2.4.1</label><title>Synthetic data fidelity metrics</title>
<p>Synthetic data fidelity was assessed through complementary statistical approaches. The <italic>Python</italic> packages used are <italic>SDV (version 1.18.0)</italic> (<xref ref-type="bibr" rid="B44">44</xref>), <italic>SDMetrics (version 0.17.0)</italic> (<xref ref-type="bibr" rid="B45">45</xref>), and <italic>Scipy (version 1.13.1)</italic> (<xref ref-type="bibr" rid="B35">35</xref>).</p>
<sec id="s2d1a"><label>2.4.1.1</label><title>Univariate distribution similarity</title>
<p>We employed the Kolmogorov&#x2013;Smirnov (<xref ref-type="bibr" rid="B46">46</xref>) complement (KSComplement) for continuous variables and the Total Variation complement (TVComplement) for categorical variables. These metrics quantified distribution similarity on a scale from 0 to 1, with higher values indicating greater fidelity (<xref ref-type="bibr" rid="B45">45</xref>). Column shapes were evaluated with an aggregate score across all variables.</p>
</sec>
<sec id="s2d1b"><label>2.4.1.2</label><title>Bivariate relationship preservation</title>
<p>We assessed pairwise variable relationships through correlation pattern analysis, quantifying the degree to which the synthetic data maintained the interrelationships in the original dataset (<xref ref-type="bibr" rid="B45">45</xref>).</p>
</sec>
<sec id="s2d1c"><label>2.4.1.3</label><title>Hellinger distance calculation</title>
<p>We computed Hellinger distances between original and synthetic distributions for each variable and overall. This probabilistic divergence measure (scaled between 0 and 1, with lower values indicating greater similarity) assessed distribution similarity sensitive to location and shape differences (<xref ref-type="bibr" rid="B47">47</xref>).</p>
</sec>
</sec>
<sec id="s2d2"><label>2.4.2</label><title>Machine learning approach</title>
<p>To evaluate the practical utility of the synthetic data, we implemented a supervised machine learning framework using a gradient-boosting regression model trained to predict the margin of stability from gait parameters and participants&#x2019; characteristics.</p>
<sec id="s2d2a"><label>2.4.2.1</label><title>Model architecture</title>
<p>We employed XGBoost regression models, a decision tree-based ensemble ML technique, selected for their capacity to capture non-linear relationships in biomechanical data across various studies (<xref ref-type="bibr" rid="B48">48</xref>&#x2013;<xref ref-type="bibr" rid="B50">50</xref>). The XGBoost minimizes the models&#x2019; residuals and increases the predictive power by combining weak learners (<xref ref-type="bibr" rid="B51">51</xref>). Using XGBoost, we aimed to identify the relationships between biomechanical parameters and the Margin of Stability, thereby establishing a model capable of accurately estimating stability from gait variables.</p>
</sec>
<sec id="s2d2b"><label>2.4.2.2</label><title>Hyperparameter optimization</title>
<p>To maximize predictive performance, we implemented a comprehensive grid search strategy using <italic>sci-kit-learn&#x0027;s GridSearchCV</italic> combined with 5-fold cross-validation. This approach evaluated all possible combinations of the following hyperparameter values for the XGBoost model (<xref ref-type="table" rid="T4">Table&#x00A0;4</xref>). The grid search process evaluated 135 different hyperparameter combinations (3&#x2009;&#x00D7;&#x2009;3&#x2009;&#x00D7;&#x2009;3&#x2009;&#x00D7;&#x2009;2&#x2009;&#x00D7;&#x2009;2), with each combination subjected to 5-fold cross-validation. The optimal configuration was selected to minimize the Mean Absolute Error (MAE) across validation folds.</p>
<table-wrap id="T4" position="float"><label>Table 4</label>
<caption><p>Hyperparameter optimization.</p></caption>
<table frame="hsides" rules="groups">
<colgroup>
<col align="left"/>
<col align="left"/>
<col align="left"/>
</colgroup>
<thead>
<tr>
<th valign="top" align="left">Classifier</th>
<th valign="top" align="center">Hyperparameter</th>
<th valign="top" align="center">Optimized parameter values</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left" rowspan="5">Extreme gradient boosting (XGBoost)</td>
<td valign="top" align="left">n_estimators</td>
<td valign="top" align="center">[100, 200, 300]</td>
</tr>
<tr>
<td valign="top" align="left">max_depth</td>
<td valign="top" align="center">[3, 5, 7]</td>
</tr>
<tr>
<td valign="top" align="left">learning_rate</td>
<td valign="top" align="center">[0.01, 0.1, 0.2]</td>
</tr>
<tr>
<td valign="top" align="left">subsample</td>
<td valign="top" align="center">[0.8, 1.0]</td>
</tr>
<tr>
<td valign="top" align="left">colsample_bytree</td>
<td valign="top" align="center">[0.8, 1.0]</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s2d2c"><label>2.4.2.3</label><title>Comparative evaluation</title>
<p>Our machine learning implementation followed a two-phase approach to evaluate predictive performance and the utility of our SDG.
<list list-type="simple">
<list-item><label>(1)</label>
<p><italic>Phase 1</italic> &#x2014; We trained the model on real-world gait data using a 70:30 train-test split of the original dataset, so we tested it on the held-out real data. We called it the TRTR (Training on Real, Testing on Real) approach.</p></list-item>
<list-item><label>(2)</label>
<p><italic>Phase 2</italic> &#x2014; We trained the model exclusively on synthetic data and then evaluated its performance by testing on the complete real-world dataset. We called it the TSTR (Training on Synthetic, Testing it on Real) approach.</p></list-item>
</list>This design allowed us to directly assess whether models trained on synthetic data could generalize effectively to real-world observations. We employed XGBoost for both phases to predict the Margin of Stability variable using the input variables listed in <xref ref-type="table" rid="T5">Table&#x00A0;5</xref>.</p>
<table-wrap id="T5" position="float"><label>Table 5</label>
<caption><p>Input and output variables for MoS prediction.</p></caption>
<table frame="hsides" rules="groups">
<colgroup>
<col align="left"/>
<col align="left"/>
<col align="left"/>
<col align="left"/>
</colgroup>
<thead>
<tr>
<th valign="top" align="left">Metric</th>
<th valign="top" align="center">Units</th>
<th valign="top" align="center">Type</th>
<th valign="top" align="center">Description</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">X Coordinate CoM<xref ref-type="table-fn" rid="table-fn2"><sup>a</sup></xref></td>
<td valign="top" align="left">Meters (m)</td>
<td valign="top" align="left">Input (Numeric)</td>
<td valign="top" align="left">X-coordinate of the Center of Mass</td>
</tr>
<tr>
<td valign="top" align="left">Y Coordinate CoM<xref ref-type="table-fn" rid="table-fn2"><sup>a</sup></xref></td>
<td valign="top" align="left">Meters (m)</td>
<td valign="top" align="left">Input (Numeric)</td>
<td valign="top" align="left">Y-coordinate of the Center of Mass</td>
</tr>
<tr>
<td valign="top" align="left">Step width</td>
<td valign="top" align="left">Meters (m)</td>
<td valign="top" align="left">Input (Numeric)</td>
<td valign="top" align="left">Width of the step during gait</td>
</tr>
<tr>
<td valign="top" align="left">CoM_Velocity</td>
<td valign="top" align="left">m/s</td>
<td valign="top" align="left">Input (Numeric)</td>
<td valign="top" align="left">Velocity of the Center of Mass</td>
</tr>
<tr>
<td valign="top" align="left">Age</td>
<td valign="top" align="left">Category</td>
<td valign="top" align="left">Input (Categorical)</td>
<td valign="top" align="left">0: Middle-old (75&#x2013;84), 1: Oldest-old (&#x2265;85)</td>
</tr>
<tr>
<td valign="top" align="left">BMI<xref ref-type="table-fn" rid="table-fn2"><sup>a</sup></xref></td>
<td valign="top" align="left">Category</td>
<td valign="top" align="left">Input (Categorical)</td>
<td valign="top" align="left">0: Underweight (&#x003C;23), 1: Healthy weight (23&#x2013;30)</td>
</tr>
<tr>
<td valign="top" align="left">Fall incidence in the last 6 months (Fall History)</td>
<td valign="top" align="left">Category</td>
<td valign="top" align="left">Input (Categorical)</td>
<td valign="top" align="left">No Falls (0), At Least One Fall (1)</td>
</tr>
<tr>
<td valign="top" align="left">MoS</td>
<td valign="top" align="left">Meters (m)</td>
<td valign="top" align="left">Output (Numeric)</td>
<td valign="top" align="left">Margin of Stability</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn id="table-fn2"><label><sup>a</sup></label>
<p>COM, center of mass; BMI, body mass index.</p></fn>
</table-wrap-foot>
</table-wrap>
<p>In terms of performance assessment, we evaluated model performance using a comprehensive set of metrics to assess prediction accuracy for the MoS output variable (<xref ref-type="table" rid="T5">Table&#x00A0;5</xref>).</p>
<p><italic>Mean Absolute Error (MAE)</italic>. Measures the average absolute difference between predicted values (<inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM10"><mml:msub><mml:mrow><mml:mover><mml:mi>y</mml:mi><mml:mo stretchy="false">&#x005E;</mml:mo></mml:mover></mml:mrow><mml:mi>i</mml:mi></mml:msub></mml:math></inline-formula>) and actual values (<inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM11"><mml:msub><mml:mi>y</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:math></inline-formula>) across all <italic>n</italic> observations, often used to deal with the problem of differentiability (see <xref ref-type="disp-formula" rid="disp-formula9">Equation&#x00A0;9</xref>). The lower the value, the better the result. A value of zero indicates a perfect fit.<disp-formula id="disp-formula9"><label>(9)</label><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="DM9"><mml:mtable rowspacing="4pt" columnspacing="1em"><mml:mtr><mml:mtd><mml:mrow><mml:mi>M</mml:mi><mml:mi>A</mml:mi><mml:mi>E</mml:mi><mml:mo>=</mml:mo><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mfrac><mml:mn>1</mml:mn><mml:mi>n</mml:mi></mml:mfrac></mml:mrow><mml:munderover><mml:mrow><mml:mo movablelimits="false">&#x2211;</mml:mo></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover><mml:mspace width="0.2em"/><mml:mo fence="false" stretchy="false">|</mml:mo><mml:msub><mml:mi>y</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>&#x2212;</mml:mo><mml:msub><mml:mrow><mml:mrow><mml:mover><mml:mi>y</mml:mi><mml:mo stretchy="false">&#x005E;</mml:mo></mml:mover></mml:mrow></mml:mrow><mml:mi>i</mml:mi></mml:msub><mml:mo fence="false" stretchy="false">|</mml:mo></mml:mstyle></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula><italic>Mean Squared Error (MSE)</italic>. Quantifies prediction error by calculating the average squared differences between predicted values and actual observations (see <xref ref-type="disp-formula" rid="disp-formula10">Equation&#x00A0;10</xref>). It is used to overcome the problem of differentiability in MAE. The lower the value, the better the result. A value of zero indicates a perfect fit.<disp-formula id="disp-formula10"><label>(10)</label><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="DM10"><mml:mtable rowspacing="4pt" columnspacing="1em"><mml:mtr><mml:mtd><mml:mrow><mml:mi>M</mml:mi><mml:mi>S</mml:mi><mml:mi>E</mml:mi><mml:mo>=</mml:mo><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mfrac><mml:mn>1</mml:mn><mml:mi>n</mml:mi></mml:mfrac></mml:mrow><mml:munderover><mml:mrow><mml:mo movablelimits="false">&#x2211;</mml:mo></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover><mml:mspace width="0.2em"/><mml:msup><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:msub><mml:mi>y</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>&#x2212;</mml:mo><mml:msub><mml:mrow><mml:mrow><mml:mover><mml:mi>y</mml:mi><mml:mo stretchy="false">&#x005E;</mml:mo></mml:mover></mml:mrow></mml:mrow><mml:mi>i</mml:mi></mml:msub><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mn>2</mml:mn></mml:msup></mml:mstyle></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula><italic>Root Mean Squared Error (RMSE)</italic>. Provides a measure of the average magnitude of prediction errors in the same units as the target variable, facilitating interpretation (see <xref ref-type="disp-formula" rid="disp-formula11">Equation&#x00A0;11</xref>). RMSE is more sensitive to outliers than MAE, but its expression in the original unit of measurement makes it important for this biomechanical application.<disp-formula id="disp-formula11"><label>(11)</label><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="DM11"><mml:mtable rowspacing="4pt" columnspacing="1em"><mml:mtr><mml:mtd><mml:mrow><mml:mi>R</mml:mi><mml:mi>M</mml:mi><mml:mi>S</mml:mi><mml:mi>E</mml:mi><mml:mo>=</mml:mo><mml:msqrt><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mfrac><mml:mn>1</mml:mn><mml:mi>n</mml:mi></mml:mfrac></mml:mrow><mml:munderover><mml:mrow><mml:mo movablelimits="false">&#x2211;</mml:mo></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover><mml:mspace width="0.2em"/><mml:msup><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:msub><mml:mi>y</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>&#x2212;</mml:mo><mml:msub><mml:mrow><mml:mrow><mml:mover><mml:mi>y</mml:mi><mml:mo stretchy="false">&#x005E;</mml:mo></mml:mover></mml:mrow></mml:mrow><mml:mi>i</mml:mi></mml:msub><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mn>2</mml:mn></mml:msup></mml:mstyle></mml:msqrt><mml:mo>=</mml:mo><mml:msqrt><mml:mi>M</mml:mi><mml:mi>S</mml:mi><mml:mi>E</mml:mi></mml:msqrt></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula><italic>Coefficient of Determination (R&#x00B2; score)</italic>. Indicates the proportion of variance in the target variable that is predictable from the independent variables. Its values range from 0 to 1, indicating no fit and fit. The higher the value, the better the result, which means the closer the R2 value is to 1, the better the model is fitted. <italic>R</italic><sup>2</sup> is calculated as 1 minus the ratio of the sum of squared errors (SSE) to the total sum of squares (SST), where <inline-formula><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="IM12"><mml:mrow><mml:mover><mml:mi>y</mml:mi><mml:mo stretchy="false">&#x00AF;</mml:mo></mml:mover></mml:mrow></mml:math></inline-formula> represents the mean of the observed values (see <xref ref-type="disp-formula" rid="disp-formula12">Equation&#x00A0;12</xref>).<disp-formula id="disp-formula12"><label>(12)</label><mml:math xmlns:mml="http://www.w3.org/1998/Math/MathML" id="DM12"><mml:mtable rowspacing="4pt" columnspacing="1em"><mml:mtr><mml:mtd><mml:mrow><mml:msup><mml:mi>R</mml:mi><mml:mn>2</mml:mn></mml:msup><mml:mo>=</mml:mo><mml:mn>1</mml:mn><mml:mo>&#x2212;</mml:mo><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mfrac><mml:mrow><mml:msubsup><mml:mrow><mml:mo movablelimits="false">&#x2211;</mml:mo></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:msubsup><mml:mspace width="0.2em"/><mml:msup><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:msub><mml:mi>y</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>&#x2212;</mml:mo><mml:msub><mml:mrow><mml:mrow><mml:mover><mml:mi>y</mml:mi><mml:mo stretchy="false">&#x005E;</mml:mo></mml:mover></mml:mrow></mml:mrow><mml:mi>i</mml:mi></mml:msub><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mn>2</mml:mn></mml:msup></mml:mrow><mml:mrow><mml:msubsup><mml:mrow><mml:mo movablelimits="false">&#x2211;</mml:mo></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:msubsup><mml:mspace width="0.2em"/><mml:msup><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:msub><mml:mi>y</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>&#x2212;</mml:mo><mml:mrow><mml:mover><mml:mi>y</mml:mi><mml:mo stretchy="false">&#x00AF;</mml:mo></mml:mover></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mn>2</mml:mn></mml:msup></mml:mrow></mml:mfrac></mml:mrow><mml:mo>=</mml:mo><mml:mn>1</mml:mn><mml:mo>&#x2212;</mml:mo><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mfrac><mml:mrow><mml:mi>S</mml:mi><mml:mi>S</mml:mi><mml:mi>E</mml:mi></mml:mrow><mml:mrow><mml:mi>S</mml:mi><mml:mi>S</mml:mi><mml:mi>T</mml:mi></mml:mrow></mml:mfrac></mml:mrow></mml:mstyle></mml:mstyle></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>These metrics allowed for a thorough comparison between our two phases, providing insight into the utility of synthetic data for MoS prediction. Additionally, they are widely recognized as reliable measures for evaluating gait parameter predictions (<xref ref-type="bibr" rid="B52">52</xref>, <xref ref-type="bibr" rid="B53">53</xref>).</p>
</sec>
<sec id="s2d2d"><label>2.4.2.4</label><title>Model interpretability</title>
<p>To understand feature contributions and enhance model transparency, we implemented Shapley Additive Explanations (SHAP) (<xref ref-type="bibr" rid="B27">27</xref>). For our XGBoost model, we used the SHAP Tree Explainer, which efficiently calculates contribution values for each feature input.</p>
<p>The SHAP analysis identified the biomechanical variables with the greatest influence on MoS predictions and enabled comparisons of feature importance patterns between models trained on real or synthetic data. This interpretability framework was essential for validating that synthetic data preserved the relationships present in the original dataset and respected well-established gait parameters principles, especially for older adults&#x2019; gait. However, this model interpretability tool can face challenges, including computational intensity for large datasets and sensitivity to noise (<xref ref-type="bibr" rid="B54">54</xref>).</p>
</sec>
</sec>
</sec>
</sec>
<sec id="s3" sec-type="results"><label>3</label><title>Results</title>
<p>The following subsections detail the results of the experiments conducted.</p>
<sec id="s3a"><label>3.1</label><title>Synthetic data fidelity analysis</title>
<sec id="s3a1"><label>3.1.1</label><title>Overall fidelity metrics</title>
<p>The synthetic data demonstrated exceptional fidelity across multiple evaluation dimensions.</p>
<p>These metrics indicate that the metadata parameters used in this approach produced synthetic data that closely mirrors the statistical properties of the original dataset while maintaining these variables&#x2019; relationships (<xref ref-type="table" rid="T6">Table&#x00A0;6</xref>).</p>
<table-wrap id="T6" position="float"><label>Table 6</label>
<caption><p>Overall synthetic data fidelity assessment.</p></caption>
<table frame="hsides" rules="groups">
<colgroup>
<col align="left"/>
<col align="center"/>
<col align="left"/>
</colgroup>
<thead>
<tr>
<th valign="top" align="left">Evaluation metric</th>
<th valign="top" align="center">Score</th>
<th valign="top" align="center">Interpretation</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Column shapes</td>
<td valign="top" align="center">98.51&#x0025;</td>
<td valign="top" align="left">Near-perfect preservation of univariate distributions</td>
</tr>
<tr>
<td valign="top" align="left">Column pair trends</td>
<td valign="top" align="center">95.67&#x0025;</td>
<td valign="top" align="left">Excellent maintenance of bivariate relationships</td>
</tr>
<tr>
<td valign="top" align="left">Overall fidelity</td>
<td valign="top" align="center">97.09&#x0025;</td>
<td valign="top" align="left">Very high overall synthetic data quality</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s3a2"><label>3.1.2</label><title>Distribution similarity analysis</title>
<p>The Kolmogorov&#x2013;Smirnov complement (KSComplement) and Total Variation complement (TVComplement) scores for individual variables demonstrated exceptional preservation of univariate distributions (<xref ref-type="table" rid="T7">Table&#x00A0;7</xref>).</p>
<table-wrap id="T7" position="float"><label>Table 7</label>
<caption><p>Distribution similarity metrics by variable.</p></caption>
<table frame="hsides" rules="groups">
<colgroup>
<col align="left"/>
<col align="left"/>
<col align="center"/>
</colgroup>
<thead>
<tr>
<th valign="top" align="left">Variable</th>
<th valign="top" align="center">Metric</th>
<th valign="top" align="center">Score</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">CoM X coordinate</td>
<td valign="top" align="left">KSComplement</td>
<td valign="top" align="center">0.978</td>
</tr>
<tr>
<td valign="top" align="left">CoM Y coordinate</td>
<td valign="top" align="left">KSComplement</td>
<td valign="top" align="center">0.977</td>
</tr>
<tr>
<td valign="top" align="left">Step Width</td>
<td valign="top" align="left">KSComplement</td>
<td valign="top" align="center">0.978</td>
</tr>
<tr>
<td valign="top" align="left">Margin of stability</td>
<td valign="top" align="left">KSComplement</td>
<td valign="top" align="center">0.979</td>
</tr>
<tr>
<td valign="top" align="left">Timestamp</td>
<td valign="top" align="left">KSComplement</td>
<td valign="top" align="center">1.00</td>
</tr>
<tr>
<td valign="top" align="left">Age</td>
<td valign="top" align="left">TVComplement</td>
<td valign="top" align="center">0.990</td>
</tr>
<tr>
<td valign="top" align="left">Fall history</td>
<td valign="top" align="left">TVComplement</td>
<td valign="top" align="center">1.00</td>
</tr>
<tr>
<td valign="top" align="left">BMI</td>
<td valign="top" align="left">TVComplement</td>
<td valign="top" align="center">0.986</td>
</tr>
<tr>
<td valign="top" align="left">CoM velocity</td>
<td valign="top" align="left">KSComplement</td>
<td valign="top" align="center">0.974</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>All variables exhibited scores above 0.97, with categorical variables (e.g., Fall History) achieving perfect preservation (1.0). This demonstrates that the synthetic data maintained the distributional characteristics of all gait parameters, which is visually confirmed in <xref ref-type="fig" rid="F3">Figure&#x00A0;3</xref>, with a high degree of overlap between the real and synthetic distributions.</p>
<fig id="F3" position="float"><label>Figure 3</label>
<caption><p>Distribution comparison between original and synthetic data. Each subplot shows its data distribution, synthetic data (blue color), and real data (gray color). Additionally, the KS Complement is introduced at the top right of each subplot to demonstrate each variable&#x0027;s fidelity performance.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="fspor-07-1646146-g003.tif"><alt-text content-type="machine-generated">Nine probability density plots compare real and synthetic datasets across various metrics: CoM X and Y coordinates, step width, margin of stability, timestamp, age, fall history, BMI, and CoM velocity. Synthetic data is shown in teal and real data in black, with Kolmogorov-Smirnov (KS) statistics included for each plot, showing high similarity.</alt-text>
</graphic>
</fig>
</sec>
<sec id="s3a3"><label>3.1.3</label><title>Probabilistic divergence assessment</title>
<p>The overall Hellinger Distance (HD)&#x2009;&#x003D;&#x2009;0.0193 indicated excellent alignment between the original and synthetic distributions. Specifically, the biomechanical variables at the core of our rank correlation-based constraints &#x2014; Step Width (HD&#x2009;&#x003D;&#x2009;0.0333), MoS (HD&#x2009;&#x003D;&#x2009;0.0332), and CoM Velocity (HD&#x2009;&#x003D;&#x2009;0.0447), retained low divergence despite the constraint enforcement.</p>
</sec>
</sec>
<sec id="s3b"><label>3.2</label><title>Performance metrics comparison</title>
<p>The synthetic data-based model (TSTR) demonstrated superior predictive performance compared to the real-data-only approach, with error metrics reduced by 56&#x0025;&#x2013;81&#x0025; and variance explanation (<italic>R</italic><sup>2</sup>) improved by 31.2&#x0025; (<xref ref-type="table" rid="T8">Table&#x00A0;8</xref>). This finding suggested that this approach may attenuate random variability and preserve its variable relationships, enhancing the model&#x0027;s ability to capture patterns in these gait parameters.</p>
<table-wrap id="T8" position="float"><label>Table 8</label>
<caption><p>Performance comparison between the model performance on &#x201C;TRTR and TSTR-based&#x201D; approaches.</p></caption>
<table frame="hsides" rules="groups">
<colgroup>
<col align="left"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
</colgroup>
<thead>
<tr>
<th valign="top" align="left">Performance metric</th>
<th valign="top" align="center">TRTR<xref ref-type="table-fn" rid="table-fn3"><sup>a</sup></xref></th>
<th valign="top" align="center">TSTR<xref ref-type="table-fn" rid="table-fn3"><sup>a</sup></xref></th>
<th valign="top" align="center"><italic>&#x0394;</italic>&#x2014;improvement</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Mean Absolute Error (MAE)</td>
<td valign="top" align="center">3.4672</td>
<td valign="top" align="center">1.4479</td>
<td valign="top" align="center">&#x2212;2.0193 (58.2&#x0025;)</td>
</tr>
<tr>
<td valign="top" align="left">Mean Squared Error (MSE)</td>
<td valign="top" align="center">18.7308</td>
<td valign="top" align="center">3.5790</td>
<td valign="top" align="center">&#x2212;15.1518 (80.9&#x0025;)</td>
</tr>
<tr>
<td valign="top" align="left">Root Mean Squared Error (RMSE)</td>
<td valign="top" align="center">4.3279</td>
<td valign="top" align="center">1.8918</td>
<td valign="top" align="center">&#x2212;2.4361 (56.3&#x0025;)</td>
</tr>
<tr>
<td valign="top" align="left"><italic>R</italic><sup>2</sup> Score</td>
<td valign="top" align="center">0.7321</td>
<td valign="top" align="center">0.9603</td>
<td valign="top" align="center">&#x002B;0.2282 (31.2&#x0025;)</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn id="table-fn3"><label><sup>a</sup></label>
<p>TRTR, training on real data and testing on real data; TSTR, training on synthetic data and testing on real data.</p></fn>
</table-wrap-foot>
</table-wrap>
<p><xref ref-type="fig" rid="F4">Figure&#x00A0;4</xref> displays the TRTR and TSTR models&#x2019; actual vs. predicted MoS values. For the TRTR model [<xref ref-type="fig" rid="F4">Figure&#x00A0;4A</xref>], while the model captured the general trend (<italic>R</italic><sup>2</sup>&#x2009;&#x003D;&#x2009;0.7321), variance is evident through the widespread scatter around the regression line. Prediction accuracy appeared limited at higher MoS values (&#x003E;30), with a dispersion of predictions. In contrast, the TSTR model [<xref ref-type="fig" rid="F4">Figure&#x00A0;4B</xref>] improved the prediction accuracy. The tighter clustering of points around the regression line visually confirmed the superior performance metrics (<italic>R</italic><sup>2</sup>&#x2009;&#x003D;&#x2009;0.9603). Prediction accuracy remained consistent across the entire range of MoS values, including at higher magnitudes where the TRTR model showed limitations.</p>
<fig id="F4" position="float"><label>Figure 4</label>
<caption><p>Comparison of predicted vs. actual Margin of Stability (MoS) values. <bold>(A)</bold> Model trained on real data and tested on real data (TRTR), with an <italic>R</italic><sup>2</sup> score of 0.7321, indicating the proportion of variance in the actual MoS values explained by the model predictions. <bold>(B)</bold> Model trained on synthetic data and tested on real data (TSTR), with an <italic>R</italic><sup>2</sup> score of 0.9603.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="fspor-07-1646146-g004.tif"><alt-text content-type="machine-generated">Two scatter plots compare Predicted MoS versus Actual MoS. The left plot shows a moderate correlation with an R-squared value of 0.7321. The right plot shows a strong correlation with an R-squared value of 0.9603. Each plot has a line of best fit.</alt-text>
</graphic>
</fig>
</sec>
<sec id="s3c"><label>3.3</label><title>Feature attribution analysis</title>
<p>The SHAP (Shapley Additive Explanations) value analysis revealed redistributions of feature influence when using synthetic data. SHAP values quantified the contribution of each feature to model predictions, with higher values indicating a greater impact on the outcome. For example, as shown in <xref ref-type="table" rid="T9">Table&#x00A0;9</xref>, the Step Width Mean SHAP value increased by 128.3&#x0025;, better reflecting its established role in stability control. The &#x201C;Fall History&#x201D; increased the mean SHAP value (1789.3&#x0025;), suggesting enhanced sensitivity to this risk factor. The BMI increased the mean SHAP value (175.7&#x0025;). Finally, the CoM_Velocity decreased mean SHAP value (37.6&#x0025;), consistent with the inverse relationship with stability. This last one potentially happened because of the rank correlation-based constraint enforcement.</p>
<table-wrap id="T9" position="float"><label>Table 9</label>
<caption><p>Mean SHAP values comparison between models.</p></caption>
<table frame="hsides" rules="groups">
<colgroup>
<col align="left"/>
<col align="center"/>
<col align="center"/>
<col align="center"/>
</colgroup>
<thead>
<tr>
<th valign="top" align="left">Feature</th>
<th valign="top" align="center">TRTR</th>
<th valign="top" align="center">TSTR</th>
<th valign="top" align="center">Directional change</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Y_Coordinate_CoM</td>
<td valign="top" align="center">5.720624</td>
<td valign="top" align="center">5.469393</td>
<td valign="top" align="center">&#x2193; (4.4&#x0025;)</td>
</tr>
<tr>
<td valign="top" align="left">X_Coordinate_CoM</td>
<td valign="top" align="center">0.733808</td>
<td valign="top" align="center">0.673718</td>
<td valign="top" align="center">&#x2193; (8.2&#x0025;)</td>
</tr>
<tr>
<td valign="top" align="left">Step_Width</td>
<td valign="top" align="center">0.719645</td>
<td valign="top" align="center">1.642897</td>
<td valign="top" align="center">&#x2191; (128.3&#x0025;)</td>
</tr>
<tr>
<td valign="top" align="left">BMI</td>
<td valign="top" align="center">0.587171</td>
<td valign="top" align="center">1.618933</td>
<td valign="top" align="center">&#x2191; (175.7&#x0025;)</td>
</tr>
<tr>
<td valign="top" align="left">Age</td>
<td valign="top" align="center">0.479669</td>
<td valign="top" align="center">0.724091</td>
<td valign="top" align="center">&#x2191; (50.9&#x0025;)</td>
</tr>
<tr>
<td valign="top" align="left">CoM_Velocity</td>
<td valign="top" align="center">0.289063</td>
<td valign="top" align="center">0.180252</td>
<td valign="top" align="center">&#x2193; (37.6&#x0025;)</td>
</tr>
<tr>
<td valign="top" align="left">Fall history</td>
<td valign="top" align="center">0.026910</td>
<td valign="top" align="center">0.508422</td>
<td valign="top" align="center">&#x2191; (1,789.3&#x0025;)</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>These shifts in SHAP values indicated that this synthetic data approach realigned model feature attribution to better reflect established gait principles, especially for the older adult population.</p>
<p><xref ref-type="fig" rid="F5">Figure&#x00A0;5</xref> demonstrates the feature attribution patterns for the TRTR and TSTR models. For TRTR [<xref ref-type="fig" rid="F5">Figure&#x00A0;5A</xref>], the horizontal distribution of points represented the SHAP value impact on model output, while color indicated feature value magnitude (blue for lower values, red for higher values). The <italic>Y_Coordinate_CoM</italic> showed the most influence on predictions, with positive and negative contributions depending on the value. <italic>Step_Width</italic> demonstrated a modest impact, particularly compared to the CoM-coordinates-based parameters. In contrast, <xref ref-type="fig" rid="F5">Figure&#x00A0;5B</xref> reveals the altered feature attribution pattern in the TSTR model. <italic>Step_Width</italic> gained greater impact in the predictions, rising to second position in importance. As mentioned before, this realignment better reflected established biomechanical principles regarding the role of step width in stability control. Fall History also showed enhanced contribution compared to the TRTR model, indicating improved sensitivity to risk factors.</p>
<fig id="F5" position="float"><label>Figure 5</label>
<caption><p>SHAP summary plot for TRTR <bold>(A)</bold> and TSTR <bold>(B)</bold> models. The color gradient reflects feature values, where red indicates higher feature values and blue indicates lower feature values.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="fspor-07-1646146-g005.tif"><alt-text content-type="machine-generated">Two SHAP value plots showing feature impacts on model output. Top plot includes features like Y and X Coordinates of Center of Mass (CoM), Step Width, BMI, Age, CoM Velocity, and Number of Falls. High feature values are in red; low values are in blue. Bottom plot orders X Coordinate CoM lower, highlighting Step Width's influence more prominently.</alt-text>
</graphic>
</fig>
</sec>
</sec>
<sec id="s4" sec-type="discussion"><label>4</label><title>Discussion</title>
<p>This study investigated the application of SDG to gait stability prediction in older adults, addressing three research questions about data fidelity and utility, predictive performance, and model interpretability. Our findings demonstrated that this synthetic data approach accurately replicates data properties of gait parameters and can also enhance predictive modeling capabilities beyond what is achievable with real-world data alone in older adults.</p>
<p>The high fidelity metrics, column shapes at 98.51&#x0025;, column pair trends at 95.67&#x0025;, and overall fidelity at 97.09&#x0025;, and subsequently preservation of variable distributions (above 0.97 in KSComplement and TVComplement scores) addressed an important challenge in movement science, maintaining biomechanical data validity whilst augmenting a limited dataset. For example, preserving categorical variables related to fall history (TVComplement&#x2009;&#x003D;&#x2009;1.00) is essential for clinical risk assessment applications. The low Hellinger distance (0.019) further confirmed the similarity between the original and synthetic distributions. Therefore, these findings demonstrated that our data-centric approach successfully captured univariate distributions and bivariate relationships. These fidelity metrics align with similar methodological approaches using evaluation metrics proposed by the Synthetic Data Vault (SDV) framework and/or Hellinger distance across all variables (<xref ref-type="bibr" rid="B15">15</xref>, <xref ref-type="bibr" rid="B55">55</xref>). Importantly (<xref ref-type="bibr" rid="B15">15</xref>), used SDV-based metrics, such as KSComplement, to assess the data fidelity of synthetic gait data generated for multiple sclerosis patients and demonstrated strong performance results with most metrics over 0.75. These findings advance beyond traditional statistical distribution matching approaches by demonstrating that constraint-based synthetic data can effectively embody relationships between domain-specific biomechanical variables. The implementation of rank correlation-based constraints to maintain established relationships between step width and margin of stability (<italic>&#x03C1;</italic>&#x2009;&#x003E;&#x2009;0.7) and between CoM velocity and stability margins (<italic>&#x03C1;</italic>&#x2009;&#x003C;&#x2009;&#x2212;0.3) represents a methodological solution in biomechanically-based SDG, depending on each research goal.</p>
<p>Regarding the data utility, the most significant finding is that models trained exclusively on synthetic data (TSTR) demonstrated superior predictive performance compared to models trained on real data alone (TRTR). The reductions in error metrics (MAE by 58.2&#x0025;, MSE by 80.9&#x0025;, and RMSE by 56.3&#x0025;) and improved variance explanation (<italic>R</italic><sup>2</sup> increase of 31.2&#x0025;) highlight the potential of the metadata configuration process used in this SDG application. These results align with the guidance from (<xref ref-type="bibr" rid="B19">19</xref>) for an SDG data-centric framework, emphasizing that high-quality synthetic data should achieve statistical fidelity and enhance utility in downstream tasks.</p>
<p>The predictive performance in <xref ref-type="fig" rid="F4">Figure&#x00A0;4</xref> further supports this interpretation, showing that while the TRTR model struggles with prediction accuracy at higher MoS values (&#x003E;30&#x2005;mm), the TSTR model maintains consistent accuracy across the entire range. This suggests that our SDG approach improved prediction accuracy at the boundaries of stability values, thus enhancing, with caution, reliability in assessing marginal dynamic stability profiles. For instance, an 85-year-old patient recovering from a mobility-constrained procedure with MoS values around 25&#x2013;35&#x2005;mm (where the TRTR model showed poor accuracy) could support a decision-making process that led to an unnecessarily prolonged rehabilitation procedure. The TSTR model&#x0027;s enhanced performance in this MoS range enables better identification of patients at the threshold of safe mobility, supporting responsible decision-making for this healthcare example.</p>
<p>The SHAP analysis revealed redistributions of feature influence in the TSTR model, with notable increases in the importance of Step Width (128.3&#x0025;), BMI (175.7&#x0025;), and Fall History (1,789.3&#x0025;). These changes suggest that the synthetic data generation process influenced the model&#x0027;s feature attribution patterns. Our findings relate to (<xref ref-type="bibr" rid="B56">56</xref>) research that, via a VICON motion capture system in 105 healthy individuals (52.87&#x2009;&#x00B1;&#x2009;19.09 years), demonstrated that step width (part of a &#x2018;base of support&#x2019; domain, as identified by the factor analysis, which included step width and step time) was a significant predictor of medio-lateral margin of stability, explaining 26&#x0025; of the variance (<italic>p</italic>&#x2009;&#x003C;&#x2009;0.0001). Their equipment setup differs from our low-cost computer vision footage-capturing approach, which makes our application emerge as an alternative for a wider clinical accessibility solution.</p>
<p>Therefore, this SHAP analysis reinforces two biomechanical principles: (1) step width serves as an active control mechanism for lateral stability, and (2) clinical history (previous falls) and anthropometric factors (BMI) influence gait stability strategies. Regarding a predictive-based perspective, CoM velocity demonstrated relatively low importance in both models (TRTR and TSTR), which appears contrary to established biomechanical theory regarding the inverse relationship between velocity and stability margins, which (<xref ref-type="bibr" rid="B8">8</xref>, <xref ref-type="bibr" rid="B57">57</xref>) demonstrated their relations that higher velocities can reduce the time available for corrective responses. This contrary relation to our findings can be explained by the experimental context of self-selected speeds. When participants walk at their preferred speed, they could optimize their gait pattern for stability and comfort, effectively minimizing the destabilizing effects of velocity that would be more apparent under imposed speed conditions. At self-selected speeds, older adults could adopt conservative velocity strategies that maintain their stability within comfortable margins, reducing the variance in velocity-stability relationships that machine learning models potentially rely on to detect feature importance. Therefore, this underscores the importance of considering the experimental context when interpreting SHAP values in gait modeling.</p>
<p>Our findings have significant implications for gait assessment in similar older adult populations. The SDG addresses persistent challenges, including limited sample sizes and constraints in extensive data collection from vulnerable populations. The improved predictive performance of the TSTR model suggests that synthetic data augmentation could enhance the accuracy of fall risk assessment tools based on stability metrics, particularly for the oldest-old population (&#x2265;85 years), where fall risk assessment carries the highest urgency (<xref ref-type="bibr" rid="B58">58</xref>), which aligns with the data that one-third of 70-year-olds and most 80-year-olds report mobility restrictions, which involves physical losses, including decreases in limb maximum muscle force and power (<xref ref-type="bibr" rid="B10">10</xref>, <xref ref-type="bibr" rid="B12">12</xref>).</p>
<sec id="s4a"><label>4.1</label><title>Limitations</title>
<p>Despite the promising results, some limitations exist: First, the sample size of 14 older adults we used, while comparable to many gait studies, remains relatively small for comprehensive synthetic data validation for this population. Future research should assess the scalability of a similar approach with more diverse cohorts representing different age groups, pathological conditions, and environmental contexts. Following this future perspective, for pathological populations (e.g., Parkinson&#x0027;s disease, stroke survivors), this SDG approach would require condition-specific constraint development. For instance, Parkinson&#x0027;s patients would potentially exhibit reduced step width variability and altered center of mass control, which would necessitate modified gait parameters correlation thresholds and potentially additional constraints reflecting disease-specific compensatory strategies. The SDG would need to preserve these pathological gait patterns whilst maintaining biomechanical plausibility.</p>
<p>Additionally, the dataset&#x0027;s composition (11 female, 3 male participants) reflects a gender imbalance that may limit the generalizability of our synthetic data generation approach. Future investigations should examine whether synthetic data generation maintains gender-specific biomechanical relationships and consider implementing gender-balanced original datasets for synthesis, or alternatively, generate synthetic data specifically for minority gender classes to address representation gaps. In other words, implement gender as a stratification variable in the metadata configuration, enabling the synthesizer to generate synthetic samples that maintain gender-specific proportions and biomechanical characteristics for synthetic data quality across gender groups.</p>
<p>Second, our SDG focused on frontal plane stability parameters derived from a single walking condition (level walking at self-paced speed). Thus, future work should extend this methodology to sagittal plane stability and responses to perturbations, which represent important aspects of stability control not captured in the current analysis. The SDG metadata configuration framework could accommodate frontal and sagittal plane parameters simultaneously, enabling the generation of synthetic data that preserves biomechanical relationships in both planes (e.g., coordination between medio-lateral and anterior-posterior stability strategies).</p>
<p>Third, while the MediaPipe algorithm provided acceptable pose tracking, advanced pose estimation algorithms optimized for biomechanical gait analysis could improve stability metrics&#x2019; precision and data quality. Advanced algorithms with improved joint tracking precision and enhanced robustness to occlusion could reduce measurement noise in center of mass calculations and step width detection, directly improving the accuracy of margin of stability computations.</p>
</sec>
<sec id="s4b"><label>4.2</label><title>Future clinical validation process</title>
<p>Our study demonstrates predictive-based SDG implementation in gait stability assessment, but comprehensive clinical validation is essential before widespread decision-making implementation. Critical validation steps include multi-site clinical trials across diverse healthcare settings to ensure methodology robustness, systematic testing in pathological populations (e.g., stroke survivors, Parkinson&#x0027;s disease patients, balance disorder patients) to validate synthetic data accuracy for clinical gait patterns, and longitudinal studies tracking patients over time to assess balance disorders prediction accuracy and rehabilitation monitoring capabilities. Additionally, clinical workflow integration requires practitioner usability studies, clinical decision support validation, and environmental robustness testing across different lighting conditions, clothes, and clinical environments to ensure smartphone-based pose tracking maintains accuracy in real-world settings.</p>
<p>Moreover, cost-effectiveness analysis comparing the methodology against current standard-of-care approaches, along with clinical outcome studies demonstrating improved patient outcomes, reduced falls, and enhanced quality of life, will be essential for healthcare adoption. Our current findings, relevant for stability assessment, provide an initial exploration for these validation efforts and position this methodology as a promising tool for low-cost gait stability assessment in clinical practice.</p>
</sec>
</sec>
<sec id="s5" sec-type="conclusions"><label>5</label><title>Conclusion</title>
<p>This study demonstrates that SDG with specific biomechanically based constraints can accurately replicate gait stability parameters in older adults, addressing our three research questions regarding data fidelity, utility, and interpretability. First, our approach replicated gait parameter statistical properties with exceptional fidelity: column shapes (98.51&#x0025;), column pair trends (95.67&#x0025;), and overall fidelity (97.09&#x0025;), with variable distributions exceeding 0.97 in KSComplement and TVComplement scores and low Hellinger distance (0.019) confirming excellent alignment between original and synthetic distributions. Second, synthetic data-trained models (TSTR) demonstrated superior predictive performance compared to real data-trained models (TRTR), achieving substantial error reductions (MAE by 58.2&#x0025;, MSE by 80.9&#x0025;, RMSE by 56.3&#x0025;) and improved variance explanation (<italic>R</italic><sup>2</sup> increase of 31.2&#x0025;), whilst maintaining consistent accuracy across the entire MoS range, including at boundary stability values (&#x003E;30&#x2005;mm) where TRTR models showed limitations. Third, SHAP analysis revealed step width, BMI, and fall history as the most significant MoS predictors, with the synthetic data approach enhancing feature attribution alignment with established biomechanical principles through increased importance of step width (128.3&#x0025;), fall history (1,789.3&#x0025;), and BMI (175.7&#x0025;). The redistribution of feature importance in the TSTR model revealed this approach&#x0027;s strength: amplifying signals aligned with established gait stability principles, creating a more interpretable predictive framework. This approach, combined with accessible computer vision methodology, contributed to advancing gait stability assessment with implications for fall risk monitoring. By enabling accurate stability assessment through smartphone cameras rather than expensive motion capture systems, this methodology could help in scenarios where resources and mobility are limited for fall risk screening, enabling earlier interventions that improve decision-making from clinicians and physiotherapists, especially through similar explainable machine learning implementation. Moreover, the improved accuracy at boundary stability values supports precision-based gait stability assessment for the most vulnerable patients regarding the margin of stability. Future work should extend these SDG-data-driven methods to diverse populations and stability conditions, potentially developing new predictive-based stability assessment solutions with varied goals, including clinical settings.</p>
</sec>
</body>
<back>
<sec id="s6" sec-type="data-availability"><title>Data availability statement</title>
<p>Publicly available datasets were analyzed in this study. This data can be found here: the original and synthetic data generated in this study can be found at: <ext-link ext-link-type="uri" xlink:href="https://github.com/mauriciomau0/Gait-Stability-Prediction-Through-Synthetic-Time-Series-and-Vision-Based-Data">https://github.com/mauriciomau0/Gait-Stability-Prediction-Through-Synthetic-Time-Series-and-Vision-Based-Data</ext-link>. Additionally, the synthetic dataset was generated from a publicly available dataset that can be accessed here: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.6084/m9.figshare.c.5515953.v1">https://doi.org/10.6084/m9.figshare.c.5515953.v1</ext-link>.</p>
</sec>
<sec id="s7" sec-type="ethics-statement"><title>Ethics statement</title>
<p>The studies involving humans were approved by University of Toronto Ethics Board. The studies were conducted in accordance with the local legislation and institutional requirements. The participants provided their written informed consent to participate in this study.</p>
</sec>
<sec id="s8" sec-type="author-contributions"><title>Author contributions</title>
<p>MC: Conceptualization, Data curation, Formal analysis, Investigation, Methodology, Validation, Visualization, Writing &#x2013; original draft, Writing &#x2013; review &#x0026; editing. CO: Supervision, Writing &#x2013; original draft, Writing &#x2013; review &#x0026; editing. VN: Resources, Software, Writing &#x2013; original draft, Writing &#x2013; review &#x0026; editing. TR: Project administration, Supervision, Writing &#x2013; original draft, Writing &#x2013; review &#x0026; editing.</p>
</sec>
<sec id="s9" sec-type="funding-information"><title>Funding</title>
<p>The author(s) declare that financial support was received for the research and/or publication of this article. This work has been funded by the Technological University of the Shannon (TUS) President&#x2019;s Doctoral Scholarship 2021.</p>
</sec>
<ack><title>Acknowledgments</title>
<p>We thank the researchers who shared this public dataset of older adults walking. We thank Dr. Brendan Kelly for his valuable effort in meetings, contributing to this research.</p>
</ack>
<sec id="s10" sec-type="COI-statement"><title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s11" sec-type="ai-statement"><title>Generative AI statement</title>
<p>The author(s) declare that no Generative AI was used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p>
</sec>
<sec id="s12" sec-type="disclaimer"><title>Publisher&#x0027;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ref-list><title>References</title>
<ref id="B1"><label>1.</label><citation citation-type="book"><person-group person-group-type="author"><name><surname>Levine</surname><given-names>D</given-names></name><name><surname>Richards</surname><given-names>J</given-names></name><name><surname>Whittle</surname><given-names>MW</given-names></name></person-group>. <source>Whittle&#x2019;s Gait Analysis</source>. <publisher-loc>Elsevier Health Sciences</publisher-loc>: <publisher-name>Amsterdam</publisher-name> (<year>2012</year>).</citation></ref>
<ref id="B2"><label>2.</label><citation citation-type="book"><person-group person-group-type="author"><name><surname>Badiye</surname><given-names>A</given-names></name><name><surname>Kathane</surname><given-names>P</given-names></name><name><surname>Krishan</surname><given-names>K</given-names></name></person-group>. <source>Forensic Gait Analysis</source>. <publisher-loc>Treasure Island, FL</publisher-loc>: <publisher-name>StatPearls Publishing</publisher-name> (<year>2021</year>).</citation></ref>
<ref id="B3"><label>3.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dewolf</surname><given-names>AH</given-names></name><name><surname>Sylos-Labini</surname><given-names>F</given-names></name><name><surname>Cappellini</surname><given-names>G</given-names></name><name><surname>Lacquaniti</surname><given-names>F</given-names></name><name><surname>Ivanenko</surname><given-names>Y</given-names></name></person-group>. <article-title>Emergence of different gaits in infancy: relationship between developing neural circuitries and changing biomechanics</article-title>. <source>Front Bioeng Biotechnol</source>. (<year>2020</year>) <volume>8</volume>:<fpage>473</fpage>. <pub-id pub-id-type="doi">10.3389/fbioe.2020.00473</pub-id><pub-id pub-id-type="pmid">32509753</pub-id></citation></ref>
<ref id="B4"><label>4.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dewolf</surname><given-names>AH</given-names></name><name><surname>Sylos-Labini</surname><given-names>F</given-names></name><name><surname>Cappellini</surname><given-names>G</given-names></name><name><surname>Ivanenko</surname><given-names>Y</given-names></name><name><surname>Lacquaniti</surname><given-names>F</given-names></name></person-group>. <article-title>Age-related changes in the neuromuscular control of forward and backward locomotion</article-title>. <source>PLoS One</source>. (<year>2021</year>) <volume>16</volume>(<issue>2</issue>):<fpage>e0246372</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0246372</pub-id><pub-id pub-id-type="pmid">33596223</pub-id></citation></ref>
<ref id="B5"><label>5.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Xu</surname><given-names>S</given-names></name><name><surname>Fang</surname><given-names>J</given-names></name><name><surname>Hu</surname><given-names>X</given-names></name><name><surname>Ngai</surname><given-names>E</given-names></name><name><surname>Guo</surname><given-names>Y</given-names></name><name><surname>Leung</surname><given-names>V</given-names></name><etal/></person-group> <article-title>Emotion recognition from gait analyses: current research and future directions</article-title>. <source>IEEE Trans Comput Soc Syst</source>. (<year>2024</year>) <volume>11</volume>(<issue>1</issue>):<fpage>363</fpage>&#x2013;<lpage>77</lpage>. <pub-id pub-id-type="doi">10.1109/TCSS.2022.3223251</pub-id></citation></ref>
<ref id="B6"><label>6.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Santos</surname><given-names>PCRD</given-names></name><name><surname>Barbieri</surname><given-names>FA</given-names></name><name><surname>Zijdewind</surname><given-names>I</given-names></name><name><surname>Gobbi</surname><given-names>LTB</given-names></name><name><surname>Lamoth</surname><given-names>C</given-names></name><name><surname>Hortob&#x00E1;gyi</surname><given-names>T</given-names></name></person-group>. <article-title>Effects of experimentally induced fatigue on healthy older adults&#x2019; gait: a systematic review</article-title>. <source>PLoS One</source>. (<year>2019</year>) <volume>14</volume>(<issue>12</issue>):<fpage>e0226939</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0226939</pub-id><pub-id pub-id-type="pmid">31887182</pub-id></citation></ref>
<ref id="B7"><label>7.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ebersbach</surname><given-names>G</given-names></name><name><surname>Sojer</surname><given-names>M</given-names></name><name><surname>M&#x00FC;ller</surname><given-names>J</given-names></name><name><surname>Heijmenberg</surname><given-names>M</given-names></name><name><surname>Poewe</surname><given-names>W</given-names></name></person-group>. <article-title>Sociocultural differences in gait</article-title>. <source>Mov Disord</source>. (<year>2000</year>) <volume>15</volume>(<issue>6</issue>):<fpage>1145</fpage>&#x2013;<lpage>7</lpage>. <pub-id pub-id-type="doi">10.1002/1531-8257(200011)15:6%3C1145::aid-mds1013%3E3.0.co;2-c</pub-id><pub-id pub-id-type="pmid">11104198</pub-id></citation></ref>
<ref id="B8"><label>8.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bruijn</surname><given-names>SM</given-names></name><name><surname>Meijer</surname><given-names>OG</given-names></name><name><surname>Beek</surname><given-names>PJ</given-names></name><name><surname>van Die&#x00EB;n</surname><given-names>JH</given-names></name></person-group>. <article-title>Assessing the stability of human locomotion: a review of current measures</article-title>. <source>J R Soc Interface</source>. (<year>2013</year>) <volume>10</volume>(<issue>83</issue>):<fpage>20120999</fpage>. <pub-id pub-id-type="doi">10.1098/rsif.2012.0999</pub-id><pub-id pub-id-type="pmid">23516062</pub-id></citation></ref>
<ref id="B9"><label>9.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zanin</surname><given-names>M</given-names></name><name><surname>Olivares</surname><given-names>F</given-names></name><name><surname>Pulido-Valdeolivas</surname><given-names>I</given-names></name><name><surname>Rausell</surname><given-names>E</given-names></name><name><surname>Gomez-Andres</surname><given-names>D</given-names></name></person-group>. <article-title>Gait analysis under the lens of statistical physics</article-title>. <source>Comput Struct Biotechnol J</source>. (<year>2022</year>) <volume>20</volume>:<fpage>3257</fpage>&#x2013;<lpage>67</lpage>. <pub-id pub-id-type="doi">10.1016/j.csbj.2022.06.022</pub-id><pub-id pub-id-type="pmid">35782747</pub-id></citation></ref>
<ref id="B10"><label>10.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Maresova</surname><given-names>P</given-names></name><name><surname>Krejcar</surname><given-names>O</given-names></name><name><surname>Maskuriy</surname><given-names>R</given-names></name><name><surname>Selamat</surname><given-names>A</given-names></name><name><surname>Melero</surname><given-names>FJ</given-names></name><name><surname>Kuca</surname><given-names>K</given-names></name></person-group>. <article-title>Challenges and opportunity in mobility among older adults&#x2014;key determinant identification</article-title>. <source>BMC Geriatr</source>. (<year>2023</year>) <volume>23</volume>(<issue>1</issue>):<fpage>447</fpage>. <pub-id pub-id-type="doi">10.1186/s12877-023-04106-7</pub-id><pub-id pub-id-type="pmid">37474928</pub-id></citation></ref>
<ref id="B11"><label>11.</label><citation citation-type="book"><person-group person-group-type="author"><name><surname>Mochizuki</surname><given-names>L</given-names></name><name><surname>Aliberti</surname><given-names>S</given-names></name></person-group>. <article-title>Gait stability and aging</article-title>. In: <person-group person-group-type="editor"><name><surname>Barbieri</surname><given-names>FA</given-names></name><name><surname>Vit&#x00F3;rio</surname><given-names>R</given-names></name><name><surname>Santos</surname><given-names>PCR</given-names></name></person-group>, editors. <source>Locomotion and Posture in Older Adults</source>. <publisher-loc>Cham</publisher-loc>: <publisher-name>Springer</publisher-name> (<year>2024</year>). p. <fpage>7</fpage>. <pub-id pub-id-type="doi">10.1007/978-3-031-74123-4_7</pub-id></citation></ref>
<ref id="B12"><label>12.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Grimmer</surname><given-names>M</given-names></name><name><surname>Riener</surname><given-names>R</given-names></name><name><surname>Walsh</surname><given-names>CJ</given-names></name><name><surname>Seyfarth</surname><given-names>A</given-names></name></person-group>. <article-title>Mobility related physical and functional losses due to aging and disease&#x2014;a motivation for lower limb exoskeletons</article-title>. <source>J Neuroeng Rehabil</source>. (<year>2019</year>) <volume>16</volume>(<issue>1</issue>):<fpage>2</fpage>. <pub-id pub-id-type="doi">10.1186/s12984-018-0458-8</pub-id><pub-id pub-id-type="pmid">30606194</pub-id></citation></ref>
<ref id="B13"><label>13.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Curtze</surname><given-names>C</given-names></name><name><surname>Buurke</surname><given-names>TJ</given-names></name><name><surname>McCrum</surname><given-names>C</given-names></name></person-group>. <article-title>Notes on the margin of stability</article-title>. <source>J Biomech</source>. (<year>2024</year>) <volume>166</volume>:<fpage>112045</fpage>. <pub-id pub-id-type="doi">10.1016/j.jbiomech.2024.112045</pub-id><pub-id pub-id-type="pmid">38484652</pub-id></citation></ref>
<ref id="B14"><label>14.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Trabassi</surname><given-names>D</given-names></name><name><surname>Castiglia</surname><given-names>SF</given-names></name><name><surname>Bini</surname><given-names>F</given-names></name><name><surname>Marinozzi</surname><given-names>F</given-names></name><name><surname>Ajoudani</surname><given-names>A</given-names></name><name><surname>Lorenzini</surname><given-names>M</given-names></name><etal/></person-group> <article-title>Optimizing rare disease gait classification through data balancing and generative AI: insights from hereditary cerebellar ataxia</article-title>. <source>Sensors</source>. (<year>2024</year>) <volume>24</volume>(<issue>11</issue>):<fpage>3613</fpage>. <pub-id pub-id-type="doi">10.3390/s24113613</pub-id><pub-id pub-id-type="pmid">38894404</pub-id></citation></ref>
<ref id="B15"><label>15.</label><citation citation-type="book"><person-group person-group-type="author"><name><surname>Gall</surname><given-names>KL</given-names></name><name><surname>Bellanger</surname><given-names>L</given-names></name><name><surname>Laplaud</surname><given-names>D</given-names></name><name><surname>Stamm</surname><given-names>A</given-names></name></person-group>. <article-title>Generation of synthetic gait data: application to multiple sclerosis patients&#x2019; gait patterns</article-title>. <comment><italic>arXiv</italic> [Preprint]</comment>. (<year>2024</year>). <comment>Available online at:</comment> <ext-link ext-link-type="uri" xlink:href="https://arxiv.org/abs/2411.10377">https://arxiv.org/abs/2411.10377</ext-link> (<comment>Accessed November 1, 2024</comment>).</citation></ref>
<ref id="B16"><label>16.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dindorf</surname><given-names>C</given-names></name><name><surname>Bartaguiz</surname><given-names>E</given-names></name><name><surname>Janssen</surname><given-names>A</given-names></name><name><surname>Ullrich</surname><given-names>P</given-names></name><name><surname>Schr&#x00F6;der</surname><given-names>J</given-names></name><name><surname>Kainz</surname><given-names>H</given-names></name><etal/></person-group> <article-title>Enhancing biomechanical machine learning with limited data: generating realistic synthetic posture data using generative artificial intelligence</article-title>. <source>Front Bioeng Biotechnol</source>. (<year>2024</year>) <volume>12</volume>:<fpage>1350135</fpage>. <pub-id pub-id-type="doi">10.3389/fbioe.2024.1350135</pub-id><pub-id pub-id-type="pmid">38419724</pub-id></citation></ref>
<ref id="B17"><label>17.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chavez</surname><given-names>JM</given-names></name><name><surname>Tang</surname><given-names>W</given-names></name></person-group>. <article-title>A vision-based system for stage classification of parkinsonian gait using machine learning and synthetic data</article-title>. <source>Sensors</source>. (<year>2022</year>) <volume>22</volume>(<issue>12</issue>):<fpage>4463</fpage>. <pub-id pub-id-type="doi">10.3390/s22124463</pub-id><pub-id pub-id-type="pmid">35746246</pub-id></citation></ref>
<ref id="B18"><label>18.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>de Souza</surname><given-names>MD</given-names></name><name><surname>Junior</surname><given-names>CRS</given-names></name><name><surname>Quintino</surname><given-names>J</given-names></name><name><surname>Santos</surname><given-names>AL</given-names></name><name><surname>da Silva</surname><given-names>FQ</given-names></name><name><surname>Zanchettin</surname><given-names>C</given-names></name></person-group>. <article-title>Exploring the impact of synthetic data on human activity recognition tasks</article-title>. <source>Procedia Comput Sci</source>. (<year>2023</year>) <volume>222</volume>:<fpage>656</fpage>&#x2013;<lpage>65</lpage>. <pub-id pub-id-type="doi">10.1016/j.procs.2023.08.203</pub-id></citation></ref>
<ref id="B19"><label>19.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lupi&#x00F3;n</surname><given-names>M</given-names></name><name><surname>Cruciani</surname><given-names>F</given-names></name><name><surname>Cleland</surname><given-names>I</given-names></name><name><surname>Nugent</surname><given-names>C</given-names></name><name><surname>Ortigosa</surname><given-names>PM</given-names></name></person-group>. <article-title>Data augmentation for human activity recognition with generative adversarial networks</article-title>. <source>IEEE J Biomed Health Inform</source>. (<year>2024</year>) <volume>28</volume>(<issue>4</issue>):<fpage>2350</fpage>&#x2013;<lpage>61</lpage>. <pub-id pub-id-type="doi">10.1109/JBHI.2024.3364910</pub-id></citation></ref>
<ref id="B20"><label>20.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hansen</surname><given-names>L</given-names></name><name><surname>Seedat</surname><given-names>N</given-names></name><name><surname>van der Schaar</surname><given-names>M</given-names></name><name><surname>Petrovic</surname><given-names>A</given-names></name></person-group>. <article-title>Reimagining synthetic tabular data generation through data-centric AI: a comprehensive benchmark</article-title>. <source>Adv Neural Inf Process Syst</source>. (<year>2023</year>) <volume>36</volume>:<fpage>33781</fpage>&#x2013;<lpage>823</lpage>. <pub-id pub-id-type="doi">10.5555/3666122.3667588</pub-id></citation></ref>
<ref id="B21"><label>21.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yoon</surname><given-names>J</given-names></name><name><surname>Jarrett</surname><given-names>D</given-names></name><name><surname>van der Schaar</surname><given-names>M</given-names></name></person-group>. <article-title>Time-series generative adversarial networks</article-title>. <source>Advances in Neural Information Processing Systems 32</source>. (<year>2019</year>).</citation></ref>
<ref id="B22"><label>22.</label><citation citation-type="book"><person-group person-group-type="author"><name><surname>Esteban</surname><given-names>C</given-names></name><name><surname>Hyland</surname><given-names>SL</given-names></name><name><surname>R&#x00E4;tsch</surname><given-names>G</given-names></name></person-group>. <article-title>Real-valued (medical) time series generation with recurrent conditional GANs</article-title>. <comment><italic>arXiv</italic> [Preprint]</comment>. (<year>2017</year>). <comment>Available online at:</comment> <ext-link ext-link-type="uri" xlink:href="https://arxiv.org/abs/1706.02633">https://arxiv.org/abs/1706.02633</ext-link> (<comment>Accessed May 20, 2025</comment>)</citation></ref>
<ref id="B23"><label>23.</label><citation citation-type="book"><person-group person-group-type="author"><name><surname>Hyndman</surname><given-names>RJ</given-names></name><name><surname>Athanasopoulos</surname><given-names>G</given-names></name></person-group>. <source>Forecasting: Principles and Practice</source>. <publisher-loc>Melbourne</publisher-loc>: <publisher-name>OTexts</publisher-name> (<year>2018</year>).</citation></ref>
<ref id="B24"><label>24.</label><citation citation-type="book"><person-group person-group-type="author"><name><surname>Chalapathy</surname><given-names>R</given-names></name><name><surname>Chawla</surname><given-names>S</given-names></name></person-group>. <article-title>Deep learning for anomaly detection: a survey</article-title>. <comment><italic>arXiv</italic> [Preprint]</comment>. (<year>2019</year>). <comment>Available online at:</comment> <ext-link ext-link-type="uri" xlink:href="https://arxiv.org/abs/1901.03407">https://arxiv.org/abs/1901.03407</ext-link> (<comment>Accessed May 20, 2025</comment>).</citation></ref>
<ref id="B25"><label>25.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ng</surname><given-names>KD</given-names></name><name><surname>Mehdizadeh</surname><given-names>S</given-names></name><name><surname>Iaboni</surname><given-names>A</given-names></name><name><surname>Mansfield</surname><given-names>A</given-names></name><name><surname>Flint</surname><given-names>A</given-names></name><name><surname>Taati</surname><given-names>B</given-names></name></person-group>. <article-title>Measuring gait variables using computer vision to assess mobility and fall risk in older adults with dementia</article-title>. <source>IEEE J Transl Eng Health Med</source>. (<year>2020</year>) <volume>8</volume>:<fpage>1</fpage>&#x2013;<lpage>9</lpage>. <pub-id pub-id-type="doi">10.1109/JTEHM.2020.2998326</pub-id></citation></ref>
<ref id="B26"><label>26.</label><citation citation-type="confproc"><person-group person-group-type="author"><name><surname>Chen</surname><given-names>T</given-names></name><name><surname>Guestrin</surname><given-names>C</given-names></name></person-group>. <article-title>XGBoost: a scalable tree boosting system</article-title>. <conf-name>Proceedings of the 22nd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining</conf-name>; <publisher-name>ACM</publisher-name> (<year>2016</year>). p. <fpage>785</fpage>&#x2013;<lpage>94</lpage></citation></ref>
<ref id="B27"><label>27.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Nohara</surname><given-names>Y</given-names></name><name><surname>Matsumoto</surname><given-names>K</given-names></name><name><surname>Soejima</surname><given-names>H</given-names></name><name><surname>Nakashima</surname><given-names>N</given-names></name></person-group>. <article-title>Explanation of machine learning models using shapley additive explanation and application for real data in hospital</article-title>. <source>Comput Methods Programs Biomed</source>. (<year>2022</year>) <volume>214</volume>:<fpage>106584</fpage>. <pub-id pub-id-type="doi">10.1016/j.cmpb.2021.106584</pub-id><pub-id pub-id-type="pmid">34942412</pub-id></citation></ref>
<ref id="B28"><label>28.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Taati</surname><given-names>B</given-names></name><name><surname>Mehdizadeh</surname><given-names>S</given-names></name><name><surname>Nabavi</surname><given-names>H</given-names></name><name><surname>Sabo</surname><given-names>A</given-names></name><name><surname>Arora</surname><given-names>T</given-names></name><name><surname>Iaboni</surname><given-names>A</given-names></name></person-group>. <article-title>The Toronto older adults gait archive: video and 3D inertial motion capture data of older adults&#x2019; walking</article-title>. <source>Figshare</source>. (<year>2022</year>). <pub-id pub-id-type="doi">10.6084/m9.figshare.c.5515953.v1</pub-id></citation></ref>
<ref id="B29"><label>29.</label><citation citation-type="book"><person-group person-group-type="author"><name><surname>Bazarevsky</surname><given-names>V</given-names></name><name><surname>Grishchenko</surname><given-names>I</given-names></name><name><surname>Raveendran</surname><given-names>K</given-names></name><name><surname>Zhu</surname><given-names>T</given-names></name><name><surname>Zhang</surname><given-names>F</given-names></name><name><surname>Grundmann</surname><given-names>M</given-names></name></person-group>. <article-title>Blazepose: on-device real-time body pose tracking</article-title>. <comment><italic>arXiv</italic> [Preprint]</comment>. (<year>2020</year>). <comment>Available online at:</comment> <ext-link ext-link-type="uri" xlink:href="https://arxiv.org/abs/2006.10204">https://arxiv.org/abs/2006.10204</ext-link> (<comment>Accessed May 15, 2025</comment>).</citation></ref>
<ref id="B30"><label>30.</label><citation citation-type="book"><person-group person-group-type="author"><name><surname>Lin</surname><given-names>TY</given-names></name><name><surname>Maire</surname><given-names>M</given-names></name><name><surname>Belongie</surname><given-names>S</given-names></name><name><surname>Hays</surname><given-names>J</given-names></name><name><surname>Perona</surname><given-names>P</given-names></name><name><surname>Ramanan</surname><given-names>D</given-names></name><etal/></person-group> <article-title>Microsoft COCO: common objects in context</article-title>. In: Fleet D, Pajdla T, Schiele B, Tuytelaars T, editors. <source>Computer Vision&#x2013;ECCV 2014: 13th European Conference, Zurich, Switzerland, September 6&#x2013;12, 2014, Proceedings, Part V 13</source>. <publisher-loc>Cham</publisher-loc>: <publisher-name>Springer International Publishing</publisher-name> (<year>2014</year>). p. <fpage>740</fpage>&#x2013;<lpage>55</lpage>.</citation></ref>
<ref id="B31"><label>31.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lafayette</surname><given-names>TBG</given-names></name><name><surname>Kunst</surname><given-names>VHL</given-names></name><name><surname>Melo</surname><given-names>PVS</given-names></name><name><surname>Guedes</surname><given-names>PO</given-names></name><name><surname>Teixeira</surname><given-names>JMXN</given-names></name><name><surname>Vasconcelos</surname><given-names>CRD</given-names></name><etal/></person-group> <article-title>Validation of angle estimation based on body tracking data from RGB-D and RGB cameras for biomechanical assessment</article-title>. <source>Sensors</source>. (<year>2023</year>) <volume>23</volume>(<issue>1</issue>):<fpage>3</fpage>. <pub-id pub-id-type="doi">10.3390/s23010003</pub-id></citation></ref>
<ref id="B32"><label>32.</label><citation citation-type="book"><person-group person-group-type="author"><name><surname>Hii</surname><given-names>CST</given-names></name><name><surname>Gan</surname><given-names>KB</given-names></name><name><surname>You</surname><given-names>HW</given-names></name><name><surname>Zainal</surname><given-names>N</given-names></name><name><surname>Ibrahim</surname><given-names>NM</given-names></name><name><surname>Azmin</surname><given-names>S</given-names></name></person-group>. <article-title>Frontal plane gait assessment using MediaPipe pose</article-title>. In: <person-group person-group-type="editor"><name><surname>Islam</surname><given-names>MT</given-names></name><name><surname>Misran</surname><given-names>N</given-names></name><name><surname>Singh</surname><given-names>MJ</given-names></name></person-group>, editors. <source>Proceedings of the 8th International Conference on Space Science and Communication. IconSpace 2023. Springer Proceedings in Physics, vol 303</source>. <publisher-loc>Singapore</publisher-loc>: <publisher-name>Springer</publisher-name> (<year>2024</year>). <pub-id pub-id-type="doi">10.1007/978-981-97-0142-1_34</pub-id></citation></ref>
<ref id="B33"><label>33.</label><citation citation-type="book"><person-group person-group-type="author"><name><surname>Winter</surname><given-names>DA</given-names></name></person-group>. <source>Biomechanics and Motor Control of Human Movement</source>. <edition>4th Eds</edition> <publisher-loc>Hoboken</publisher-loc>: <publisher-name>John Wiley &#x0026; Sons</publisher-name> (<year>2009</year>).</citation></ref>
<ref id="B34"><label>34.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>McKinney</surname><given-names>W</given-names></name></person-group>. <article-title>Pandas: a foundational python library for data analysis and statistics</article-title>. <source>Python High Perform Sci Comp</source>. (<year>2011</year>) <volume>14</volume>:<fpage>1</fpage>&#x2013;<lpage>9</lpage>.</citation></ref>
<ref id="B35"><label>35.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Virtanen</surname><given-names>P</given-names></name><name><surname>Gommers</surname><given-names>R</given-names></name><name><surname>Oliphant</surname><given-names>TE</given-names></name><name><surname>Haberland</surname><given-names>M</given-names></name><name><surname>Reddy</surname><given-names>T</given-names></name><name><surname>Cournapeau</surname><given-names>D</given-names></name><etal/></person-group> <article-title>Scipy 1.0: fundamental algorithms for scientific computing in python</article-title>. <source>Nat Methods</source>. (<year>2020</year>) <volume>17</volume>(<issue>3</issue>):<fpage>261</fpage>&#x2013;<lpage>72</lpage>. <pub-id pub-id-type="doi">10.1038/s41592-019-0686-2</pub-id><pub-id pub-id-type="pmid">32015543</pub-id></citation></ref>
<ref id="B36"><label>36.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Crenna</surname><given-names>F</given-names></name><name><surname>Rossi</surname><given-names>GB</given-names></name><name><surname>Berardengo</surname><given-names>M</given-names></name></person-group>. <article-title>Filtering biomechanical signals in movement analysis</article-title>. <source>Sensors</source>. (<year>2021</year>) <volume>21</volume>(<issue>13</issue>):<fpage>4580</fpage>. <pub-id pub-id-type="doi">10.3390/s21134580</pub-id><pub-id pub-id-type="pmid">34283131</pub-id></citation></ref>
<ref id="B37"><label>37.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sugiyama</surname><given-names>Y</given-names></name><name><surname>Uno</surname><given-names>K</given-names></name><name><surname>Matsui</surname><given-names>Y</given-names></name></person-group>. <article-title>Types of anomalies in two-dimensional video-based gait analysis in uncontrolled environments</article-title>. <source>PLoS Comput Biol</source>. (<year>2023</year>) <volume>19</volume>(<issue>1</issue>):<fpage>e1009989</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pcbi.1009989</pub-id><pub-id pub-id-type="pmid">36656820</pub-id></citation></ref>
<ref id="B38"><label>38.</label><citation citation-type="book"><person-group person-group-type="author"><name><surname>Brownlee</surname><given-names>J</given-names></name></person-group>. <source>How to use Statistics to Identify Outliers in Data</source>. <publisher-loc>San Francisco</publisher-loc>: <publisher-name>Machine Learning Mastery</publisher-name> (<year>2020</year>). <comment>Available online at:</comment> <ext-link ext-link-type="uri" xlink:href="https://machinelearningmastery.com/how-to-use-statistics-to-identify-outliers-in-data/">https://machinelearningmastery.com/how-to-use-statistics-to-identify-outliers-in-data/</ext-link> (<comment>Accessed May 30, 2025</comment>).</citation></ref>
<ref id="B39"><label>39.</label><citation citation-type="confproc"><person-group person-group-type="author"><name><surname>Agarwal</surname><given-names>S</given-names></name></person-group>. <article-title>Data mining: data mining concepts and techniques</article-title>. <conf-name>2013 International Conference on Machine Intelligence and Research Advancement</conf-name>; <conf-loc>Katra, India</conf-loc>: <publisher-name>IEEE</publisher-name> (<year>2013</year>). p. <fpage>203</fpage>&#x2013;<lpage>7</lpage>. <pub-id pub-id-type="doi">10.1109/ICMIRA.2013.45</pub-id></citation></ref>
<ref id="B40"><label>40.</label><citation citation-type="book"><collab>YData</collab>. <source>Ydata-sdk (Version 2.0.0) [Computer Software]</source>. <publisher-loc>New York, NY</publisher-loc>: <publisher-name>YData AI</publisher-name> (<year>2024</year>). <comment>Available online at:</comment> <ext-link ext-link-type="uri" xlink:href="https://docs.fabric.ydata.ai/latest/sdk/">https://docs.fabric.ydata.ai/latest/sdk/</ext-link> (<comment>Accessed May 30, 2025</comment>).</citation></ref>
<ref id="B41"><label>41.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname><given-names>Y</given-names></name><name><surname>Luo</surname><given-names>Z</given-names></name><name><surname>Li</surname><given-names>J</given-names></name><name><surname>Du</surname><given-names>J</given-names></name><name><surname>Sun</surname><given-names>D</given-names></name><name><surname>Ivanenko</surname><given-names>Y</given-names></name><etal/></person-group> <article-title>The biomechanical influence of step width on typical locomotor activities: a systematic review</article-title>. <source>Sports Med Open</source>. (<year>2024</year>) <volume>10</volume>(<issue>1</issue>):<fpage>83</fpage>. <pub-id pub-id-type="doi">10.1186/s40798-024-00750-4</pub-id><pub-id pub-id-type="pmid">39068296</pub-id></citation></ref>
<ref id="B42"><label>42.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dingwell</surname><given-names>JB</given-names></name><name><surname>Marin</surname><given-names>LC</given-names></name></person-group>. <article-title>Kinematic variability and local dynamic stability of upper body motions when walking at different speeds</article-title>. <source>J Biomech</source>. (<year>2006</year>) <volume>39</volume>:<fpage>444</fpage>&#x2013;<lpage>52</lpage>. <pub-id pub-id-type="doi">10.1016/j.jbiomech.2004.12.014</pub-id><pub-id pub-id-type="pmid">16389084</pub-id></citation></ref>
<ref id="B43"><label>43.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>England</surname><given-names>SA</given-names></name><name><surname>Granata</surname><given-names>KP</given-names></name></person-group>. <article-title>The influence of gait speed on local dynamic stability of walking</article-title>. <source>Gait Posture</source>. (<year>2007</year>) <volume>25</volume>:<fpage>172</fpage>&#x2013;<lpage>8</lpage>. <pub-id pub-id-type="doi">10.1016/j.gaitpost.2006.03.003</pub-id><pub-id pub-id-type="pmid">16621565</pub-id></citation></ref>
<ref id="B44"><label>44.</label><citation citation-type="confproc"><person-group person-group-type="author"><name><surname>Patki</surname><given-names>N</given-names></name><name><surname>Wedge</surname><given-names>R</given-names></name><name><surname>Veeramachaneni</surname><given-names>K</given-names></name></person-group>. <article-title>The synthetic data vault</article-title>. <conf-name>IEEE International Conference on Data Science and Advanced Analytics (DSAA)</conf-name>; <publisher-name>IEEE</publisher-name> (<year>2016</year>). p. <fpage>399</fpage>&#x2013;<lpage>410</lpage>. <pub-id pub-id-type="doi">10.1109/DSAA.2016.49</pub-id></citation></ref>
<ref id="B45"><label>45.</label><citation citation-type="book"><collab>DataCebo Inc</collab>. <source>Synthetic Data Metrics (Version 0.17.0) [Computer Software]</source>. <publisher-loc>New York, NY</publisher-loc>: <publisher-name>IEEE</publisher-name> (<year>2023</year>). <comment>Available online at:</comment> <ext-link ext-link-type="uri" xlink:href="https://docs.sdv.dev/sdmetrics/">https://docs.sdv.dev/sdmetrics/</ext-link> (<comment>Accessed May 30, 2025</comment>).</citation></ref>
<ref id="B46"><label>46.</label><citation citation-type="book"><person-group person-group-type="author"><name><surname>Berger</surname><given-names>VW</given-names></name><name><surname>Zhou</surname><given-names>Y</given-names></name></person-group>. <article-title>Kolmogorov&#x2013;smirnov test: overview</article-title>. In: <person-group person-group-type="editor"><name><surname>Balakrishnan</surname><given-names>N</given-names></name><name><surname>Colton</surname><given-names>T</given-names></name><name><surname>Everitt</surname><given-names>B</given-names></name><name><surname>Piegorsch</surname><given-names>W</given-names></name><name><surname>Ruggeri</surname><given-names>F</given-names></name><name><surname>Teugels</surname><given-names>JL</given-names></name></person-group>, editors. <source>Wiley StatsRef: Statistics Reference Online</source>. <publisher-loc>Hoboken</publisher-loc>: <publisher-name>John Wiley &#x0026; Sons</publisher-name> (<year>2014</year>). <pub-id pub-id-type="doi">10.1002/9781118445112.stat06558</pub-id></citation></ref>
<ref id="B47"><label>47.</label><citation citation-type="book"><person-group person-group-type="author"><name><surname>Oosterhoff</surname><given-names>J</given-names></name><name><surname>van Zwet</surname><given-names>WR</given-names></name></person-group>. <article-title>A note on contiguity and hellinger distance</article-title>. In: <person-group person-group-type="editor"><name><surname>van de Geer</surname><given-names>S</given-names></name><name><surname>Wegkamp</surname><given-names>M</given-names></name></person-group>, editors. <source>Selected Works of Willem van Zwet. Selected Works in Probability and Statistics</source>. <publisher-loc>New York</publisher-loc>: <publisher-name>Springer</publisher-name> (<year>2012</year>). <pub-id pub-id-type="doi">10.1007/978-1-4614-1314-1_6</pub-id></citation></ref>
<ref id="B48"><label>48.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Noh</surname><given-names>B</given-names></name><name><surname>Youm</surname><given-names>C</given-names></name><name><surname>Goh</surname><given-names>E</given-names></name><name><surname>Lee</surname><given-names>M</given-names></name><name><surname>Park</surname><given-names>H</given-names></name><name><surname>Jeon</surname><given-names>H</given-names></name><etal/></person-group> <article-title>XGBoost based machine learning approach to predict the risk of fall in older adults using gait outcomes</article-title>. <source>Sci Rep</source>. (<year>2021</year>) <volume>11</volume>(<issue>1</issue>):<fpage>12183</fpage>. <pub-id pub-id-type="doi">10.1038/s41598-021-91797-w</pub-id><pub-id pub-id-type="pmid">34108595</pub-id></citation></ref>
<ref id="B49"><label>49.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Vora</surname><given-names>C</given-names></name><name><surname>Katkar</surname><given-names>V</given-names></name><name><surname>Lunagaria</surname><given-names>M</given-names></name></person-group>. <article-title>Gait analysis based on gender detection using pre-trained models and tune parameters</article-title>. <source>Discov Artif Intell</source>. (<year>2024</year>) <volume>4</volume>:<fpage>19</fpage>. <pub-id pub-id-type="doi">10.1007/s44163-024-00115-6</pub-id></citation></ref>
<ref id="B50"><label>50.</label><citation citation-type="confproc"><person-group person-group-type="author"><name><surname>Park</surname><given-names>B</given-names></name><name><surname>Kim</surname><given-names>M</given-names></name><name><surname>Jung</surname><given-names>D</given-names></name><name><surname>Lee</surname><given-names>D</given-names></name><name><surname>Kim</surname><given-names>J</given-names></name><name><surname>Mun</surname><given-names>KR</given-names></name></person-group>. <article-title>Classification of abnormal gaits with machine learning algorithms using sensor-inherited insoles</article-title>. <conf-name>2024 46th Annual International Conference of the IEEE Engineering in Medicine and Biology Society (EMBC)</conf-name>; <conf-loc>Orlando, FL, USA</conf-loc>: <publisher-name>IEEE</publisher-name> (<year>2024</year>). p. <fpage>1</fpage>&#x2013;<lpage>4</lpage>. <pub-id pub-id-type="doi">10.1109/EMBC53108.2024.10782460</pub-id></citation></ref>
<ref id="B51"><label>51.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dey</surname><given-names>A</given-names></name></person-group>. <article-title>Machine learning algorithms: a review</article-title>. <source>Int J Comput Sci Inf Technol</source>. (<year>2016</year>) <volume>7</volume>:<fpage>1174</fpage>&#x2013;<lpage>9</lpage>. <pub-id pub-id-type="doi">10.1109/EMBC53108.2024.10782460</pub-id></citation></ref>
<ref id="B52"><label>52.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Agrawal</surname><given-names>S</given-names></name><name><surname>Yadala</surname><given-names>R</given-names></name><name><surname>Goyal</surname><given-names>P</given-names></name><name><surname>Bharti</surname><given-names>J</given-names></name></person-group>. <article-title>Gait movement analysis using polynomial regression</article-title>. <source>Int J Res Appl Sci Eng Technol</source>. (<year>2022</year>) <volume>10</volume>(<issue>3</issue>):<fpage>2393</fpage>&#x2013;<lpage>9</lpage>. <pub-id pub-id-type="doi">10.22214/ijraset.2022.40979</pub-id></citation></ref>
<ref id="B53"><label>53.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ozates</surname><given-names>ME</given-names></name><name><surname>Salami</surname><given-names>F</given-names></name><name><surname>Wolf</surname><given-names>SI</given-names></name><name><surname>Arslan</surname><given-names>YZ</given-names></name></person-group>. <article-title>Estimating ground reaction forces from gait kinematics in cerebral palsy: a convolutional neural network approach</article-title>. <source>Ann Biomed Eng</source>. (<year>2025</year>) <volume>53</volume>:<fpage>634</fpage>&#x2013;<lpage>43</lpage>. <pub-id pub-id-type="doi">10.1007/s10439-024-03658-y</pub-id><pub-id pub-id-type="pmid">39616286</pub-id></citation></ref>
<ref id="B54"><label>54.</label><citation citation-type="book"><person-group person-group-type="author"><name><surname>Li</surname><given-names>X</given-names></name><name><surname>Zhou</surname><given-names>Y</given-names></name><name><surname>Dvornek</surname><given-names>N</given-names></name><name><surname>Gu</surname><given-names>Y</given-names></name><name><surname>Ventola</surname><given-names>P</given-names></name><name><surname>Duncan</surname><given-names>J</given-names></name></person-group>. <article-title>Efficient shapley explanation for features importance estimation under uncertainty</article-title>. In: Martel AL, Abolmaesumi P, Stoyanov D, Mateus D, Zuluaga MA, Zhou SK, et al., editors. <source>Medical Image Computing and Computer-Assisted Intervention&#x2014;MICCAI 2020. Lecture Notes in Computer Science, vol 12261</source>. <publisher-loc>Cham</publisher-loc>: <publisher-name>Springer</publisher-name> (<year>2020</year>). p. <fpage>792</fpage>&#x2013;<lpage>801</lpage>. <pub-id pub-id-type="doi">10.1007/978-3-030-59710-8_77</pub-id></citation></ref>
<ref id="B55"><label>55.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Emam K</surname><given-names>E</given-names></name><name><surname>Mosquera</surname><given-names>L</given-names></name><name><surname>Fang</surname><given-names>X</given-names></name><name><surname>El-Hussuna</surname><given-names>A</given-names></name></person-group>. <article-title>Utility metrics for evaluating synthetic health data generation methods: validation study</article-title>. <source>JMIR Med Inform</source>. (<year>2022</year>) <volume>10</volume>(<issue>4</issue>):<fpage>e35734</fpage>. <pub-id pub-id-type="doi">10.2196/35734</pub-id><pub-id pub-id-type="pmid">35389366</pub-id></citation></ref>
<ref id="B56"><label>56.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Herssens</surname><given-names>N</given-names></name><name><surname>van Criekinge</surname><given-names>T</given-names></name><name><surname>Saeys</surname><given-names>W</given-names></name><name><surname>Truijen</surname><given-names>S</given-names></name><name><surname>Vereeck</surname><given-names>L</given-names></name><name><surname>van Rompaey</surname><given-names>V</given-names></name><etal/></person-group> <article-title>An investigation of the spatio-temporal parameters of gait and margins of stability throughout adulthood</article-title>. <source>J R Soc Interface</source>. (<year>2020</year>) <volume>17</volume>(<issue>166</issue>):<fpage>20200194</fpage>. <pub-id pub-id-type="doi">10.1098/rsif.2020.0194</pub-id><pub-id pub-id-type="pmid">32429825</pub-id></citation></ref>
<ref id="B57"><label>57.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hak</surname><given-names>L</given-names></name><name><surname>Houdijk</surname><given-names>H</given-names></name><name><surname>Steenbrink</surname><given-names>F</given-names></name><name><surname>Mert</surname><given-names>A</given-names></name><name><surname>van der Wurff</surname><given-names>P</given-names></name><name><surname>Beek</surname><given-names>PJ</given-names></name><etal/></person-group> <article-title>Speeding up or slowing down?: gait adaptations to preserve gait stability in response to balance perturbations</article-title>. <source>Gait Posture</source>. (<year>2012</year>) <volume>36</volume>(<issue>2</issue>):<fpage>260</fpage>&#x2013;<lpage>4</lpage>. <pub-id pub-id-type="doi">10.1016/j.gaitpost.2012.03.005</pub-id><pub-id pub-id-type="pmid">22464635</pub-id></citation></ref>
<ref id="B58"><label>58.</label><citation citation-type="journal"><collab>Centers for Disease Control and Prevention (CDC)</collab>. <article-title>Self-reported falls and fall-related injuries among persons aged &#x2265;65 years&#x2014;United States, 2006</article-title>. <source>MMWR Morb Mortal Wkly Rep</source>. (<year>2008</year>) <volume>57</volume>(<issue>9</issue>):<fpage>225</fpage>&#x2013;<lpage>9</lpage>.<pub-id pub-id-type="pmid">18322444</pub-id></citation></ref>
<ref id="B59"><label>59.</label><citation citation-type="other"><article-title>MediaPipe Pose</article-title>. (<year>2024</year>). <comment>Available online at:</comment> <ext-link ext-link-type="uri" xlink:href="https://github.com/google-ai-edge/mediapipe/blob/master/docs/solutions/pose.md">https://github.com/google-ai-edge/mediapipe/blob/master/docs/solutions/pose.md</ext-link> (<comment>Accessed May 20, 2025</comment>).</citation></ref></ref-list>
</back>
</article>