<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3-mathml3.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:ali="http://www.niso.org/schemas/ali/1.0/" article-type="research-article" dtd-version="1.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Public Health</journal-id>
<journal-title-group>
<journal-title>Frontiers in Public Health</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Public Health</abbrev-journal-title>
</journal-title-group>
<issn pub-type="epub">2296-2565</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fpubh.2026.1729879</article-id>
<article-version article-version-type="Version of Record" vocab="NISO-RP-8-2008"/>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Original Research</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>Determinants of work-related musculoskeletal disorders among coal miners in Jining, China: development of a predictive risk model</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" equal-contrib="yes"><name><surname>Li</surname> <given-names>Jiali</given-names></name><xref ref-type="aff" rid="aff1"><sup>1</sup></xref><xref ref-type="author-notes" rid="fn0001"><sup>&#x2020;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/3360127"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x0026; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
</contrib>
<contrib contrib-type="author" equal-contrib="yes"><name><surname>Zhang</surname> <given-names>Xuemei</given-names></name><xref ref-type="aff" rid="aff2"><sup>2</sup></xref><xref ref-type="author-notes" rid="fn0001"><sup>&#x2020;</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x0026; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
</contrib>
<contrib contrib-type="author" equal-contrib="yes"><name><surname>Li</surname> <given-names>Yuchen</given-names></name><xref ref-type="aff" rid="aff1"><sup>1</sup></xref><xref ref-type="author-notes" rid="fn0001"><sup>&#x2020;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/3250104"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="visualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/visualization/">Visualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x0026; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
</contrib>
<contrib contrib-type="author"><name><surname>Ding</surname> <given-names>Wenwen</given-names></name><xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/1270886"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x0026; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
</contrib>
<contrib contrib-type="author"><name><surname>Duan</surname> <given-names>Wenhua</given-names></name><xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/1135875"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x0026; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
</contrib>
<contrib contrib-type="author"><name><surname>Lim</surname> <given-names>David</given-names></name><xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/2607543"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x0026; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role>
</contrib>
<contrib contrib-type="author" corresp="yes"><name><surname>Liang</surname> <given-names>Yumin</given-names></name><xref ref-type="aff" rid="aff2"><sup>2</sup></xref><xref ref-type="corresp" rid="c001"><sup>&#x002A;</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x0026; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
</contrib>
<contrib contrib-type="author" corresp="yes"><name><surname>Feng</surname> <given-names>Zhihui</given-names></name><xref ref-type="aff" rid="aff1"><sup>1</sup></xref><xref ref-type="corresp" rid="c001"><sup>&#x002A;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/1182046"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Funding acquisition" vocab-term-identifier="https://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x0026; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
</contrib>
</contrib-group>
<aff id="aff1"><label>1</label><institution>Department of Labor Hygiene and Environmental Hygiene, School of Public Health, Cheeloo College of Medicine, Shandong University</institution>, <city>Jinan</city>, <country country="cn">China</country></aff>
<aff id="aff2"><label>2</label><institution>Jining City Centre for Disease Control and Prevention</institution>, <city>Jining</city>, <country country="cn">China</country></aff>
<aff id="aff3"><label>3</label><institution>Faculty of Health, University of Technology Sydney</institution>, <city>Ultimo</city>, <state>NSW</state>, <country country="au">Australia</country></aff>
<author-notes>
<corresp id="c001"><label>&#x002A;</label>Correspondence: Zhihui Feng, <email xlink:href="mailto:fengzhihui@sdu.edu.cn">fengzhihui@sdu.edu.cn</email>; Yumin Liang, <email xlink:href="mailto:lymin001@163.com">lymin001@163.com</email></corresp>
<fn fn-type="equal" id="fn0001">
<label>&#x2020;</label>
<p>These authors have contributed equally to this work and share first authorship</p>
</fn>
</author-notes>
<pub-date publication-format="electronic" date-type="pub" iso-8601-date="2026-02-05">
<day>05</day>
<month>02</month>
<year>2026</year>
</pub-date>
<pub-date publication-format="electronic" date-type="collection">
<year>2026</year>
</pub-date>
<volume>14</volume>
<elocation-id>1729879</elocation-id>
<history>
<date date-type="received">
<day>22</day>
<month>10</month>
<year>2025</year>
</date>
<date date-type="rev-recd">
<day>22</day>
<month>01</month>
<year>2026</year>
</date>
<date date-type="accepted">
<day>22</day>
<month>01</month>
<year>2026</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2026 Li, Zhang, Li, Ding, Duan, Lim, Liang and Feng.</copyright-statement>
<copyright-year>2026</copyright-year>
<copyright-holder>Li, Zhang, Li, Ding, Duan, Lim, Liang and Feng</copyright-holder>
<license>
<ali:license_ref start_date="2026-02-05">https://creativecommons.org/licenses/by/4.0/</ali:license_ref>
<license-p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</license-p>
</license>
</permissions>
<abstract>
<sec>
<title>Background</title>
<p>Work-related musculoskeletal disorders (WMSD) are highly prevalent among coal miners and pose a significant threat to occupational health. Understanding the underlying risk factors and developing a predictive model for WMSD risk can help to mitigate WMSD.</p>
</sec>
<sec>
<title>Objective</title>
<p>To identify key determinants of WMSD among coal miners in Jinang, China, and construct a predictive model to assess risk.</p>
</sec>
<sec>
<title>Methods</title>
<p>One thousand four hundred nine coal miners from two coal mining companies were surveyed using the modified Chinese Muscle Questionnaire (CMQ). Prevalence rates and risk factors were assessed using logistic regression. Machine learning algorithms were applied to construct the predictive model.</p>
</sec>
<sec>
<title>Results</title>
<p>The 12-month overall prevalence of WMSD was 82%, with the neck (59.5%), shoulders (53.4%), and lower back (46.5%) being the most affected. Eight variables, including smoking behaviors, perceived health status, and uncomfortable working posture, were significantly associated with WMSD (<italic>p</italic>&#x202F;&#x003C;&#x202F;0.05). The neural network model achieved the highest performance (area under the curve: 0.886 on training and 0.704 on test). The fused model outperformed individual models in the final stacking integration learning.</p>
</sec>
<sec>
<title>Conclusion</title>
<p>Work-related musculoskeletal disorders are highly prevalent among Chinese coal miners and are influenced by personal and work-related factors. Machine learning models, particularly ensemble approaches, offer promise for risk prediction and targeted prevention.</p>
</sec>
</abstract>
<kwd-group>
<kwd>coal miners</kwd>
<kwd>machine learning</kwd>
<kwd>predictive model</kwd>
<kwd>risk factors</kwd>
<kwd>work-related musculoskeletal disorders</kwd>
</kwd-group>
<funding-group>
<funding-statement>The author(s) declared that financial support was received for this work and/or its publication. This study was supported by the National Natural Science Foundation of China (Project No. 82173460).</funding-statement>
</funding-group>
<counts>
<fig-count count="1"/>
<table-count count="11"/>
<equation-count count="0"/>
<ref-count count="36"/>
<page-count count="14"/>
<word-count count="8704"/>
</counts>
<custom-meta-group>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Occupational Health and Safety</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="sec1">
<label>1</label>
<title>Introduction</title>
<p>Work-related musculoskeletal disorders (WMSD) are a category of cumulative injuries affecting the musculoskeletal system and refer to injuries and disorders that occur to muscles, nerves, tendons, ligaments, joints, cartilage, and intervertebral disks (<xref ref-type="bibr" rid="ref1">1</xref>). WMSD symptoms usually develop gradually over a period of time rather than being caused by a single traumatic event (<xref ref-type="bibr" rid="ref2">2</xref>). WMSD can be caused by prolonged maintenance of specific static positions or postures, and by repetitive movements required by specific job tasks. It mainly affects the neck, shoulders, limbs, and back and lumbar region (<xref ref-type="bibr" rid="ref3">3</xref>). WMSD not only affects the quality of life of individual workers but also imposes a significant economic burden on society through reduced operational efficiency (reduced productivity, increased absenteeism), affected workforce stability (increased turnover, early retirement), increased costs (medical expenses, insurance and compensation), and psychological distress. WMSD is one of the world&#x2019;s most pressing health challenges (<xref ref-type="bibr" rid="ref4">4</xref>). The recent Global Burden of Disease Study 2019 estimated that approximately 1.71 billion people worldwide are affected by musculoskeletal disorders, this represents the most significant contributor to overall disease prevalence globally (<xref ref-type="bibr" rid="ref5">5</xref>). WMSDs rank second among occupational diseases in many European and North American countries. In the United States (US), WMSDs represent the fastest-growing category of occupational illness, resulting in annual workers&#x2019; compensation and insurance costs amounting to tens of billions of US dollars. In Europe, approximately 30% of workers report experiencing back pain, underscoring the substantial burden of musculoskeletal conditions in the workforce. In Japan, WMSDs constitute the largest category of work-related diseases, accounting for one-third or more of all registered occupational diseases (<xref ref-type="bibr" rid="ref6">6</xref>). Evidence from China similarly indicates a high prevalence of WMSDs in occupational groups. In manufacturing settings, a meta-analysis focusing on China&#x2019;s automobile manufacturing industry estimated a pooled 12-month WMSDs prevalence of 53.1% (<xref ref-type="bibr" rid="ref7">7</xref>).</p>
<p>While China has pledged to achieve carbon neutrality by 2060, coal remains central to the country&#x2019;s energy infrastructure. As the world&#x2019;s largest producer of raw coal, China employs millions of workers across coal mining, processing, washing, and beneficiation sectors (<xref ref-type="bibr" rid="ref8">8</xref>). Coal miners represent a distinct occupational group due to their exposure to high-stress conditions and harsh environments. Their work involves prolonged exposure to dust, chemical agents, physical strain, and biological hazards, factors that collectively contribute to psychological stress, job fatigue, and burnout (<xref ref-type="bibr" rid="ref9">9</xref>). Among the health challenges faced by this workforce, WMSD has emerged as a particularly pressing concern (<xref ref-type="bibr" rid="ref10">10</xref>). Globally, coal miners exhibit a notably high prevalence of WMSD, underscoring the need for targeted occupational health interventions (<xref ref-type="bibr" rid="ref11">11</xref>).</p>
<p>While several factors are known to be associated with WMSD, their relative impact can vary depending on region, occupational, and individual differences. These risk factors have different effects on the body, leading to diverse manifestations of WMSD (<xref ref-type="bibr" rid="ref12">12</xref>). Research on predictive models of WMSD pertaining to coal mining is limited (<xref ref-type="bibr" rid="ref13">13</xref>). Advancement in technology, such as machine learning, offers an opportunity to harness data to better predict the determinants of WMSD.</p>
<p>In this study, a modified version of the musculoskeletal questionnaire was used to identify the risk factors for WMSDs. Machine learning algorithms were used to construct a prediction model for WMSD based on the collected data. The goal is to provide a scientifically grounded approach for the prevention and protection of workers&#x2019; health.</p>
</sec>
<sec sec-type="materials|methods" id="sec2">
<label>2</label>
<title>Materials and methods</title>
<sec id="sec3">
<label>2.1</label>
<title>Study design and setting</title>
<p>This study employed a cross-sectional design to investigate the prevalence and determinants of work-related musculoskeletal disorders (WMSDs) among frontline coal mining workers and to develop predictive models for WMSD risk using both traditional statistical methods and machine learning algorithms. This study was reported in accordance with the Strengthening the Reporting of Observational Studies in Epidemiology (STROBE) statement: guidelines for reporting observational studies (<xref ref-type="bibr" rid="ref14">14</xref>). The cross-sectional survey was conducted between January and February 2024 in two coal mining companies in Jining City, Shandong Province, China.</p>
</sec>
<sec id="sec4">
<label>2.2</label>
<title>Participants</title>
<sec id="sec5">
<label>2.2.1</label>
<title>Comparability of participants</title>
<p>The study population comprised frontline operational workers employed at two coal mining enterprises in Jining City, Shandong Province. The two participating coal mining companies were broadly comparable in terms of organizational structure, each comprising similar production departments, frontline job categories and descriptions, and occupational health and safety management systems. With respect to job responsibilities and work equipment, workers in both companies were primarily engaged in coal extraction, tunneling, and related underground auxiliary operations. The nature of the work and the production equipment used were consistent with standard practices in the coal mining industry and were therefore highly comparable. Regarding working hours, both companies operated a shift-based system; however, the schedules differ: a 40-h work week in one company and a 36-h work week in the other. Overall, despite these differences in weekly working hours, the two companies were comparable in terms of job characteristics and descriptions, working environments, and potential occupational exposure profiles.</p>
</sec>
<sec id="sec6">
<label>2.2.2</label>
<title>Eligibility criteria and participant selection</title>
<p>Frontline operational workers were eligible for inclusion if they met the following criteria:</p>
<list list-type="alpha-lower">
<list-item>
<p>in full-time employment for more than 1 year.</p>
</list-item>
<list-item>
<p>&#x2265;18&#x202F;years old.</p>
</list-item>
<list-item>
<p>No language or communication barriers.</p>
</list-item>
<list-item>
<p>Provided express and informed consent to participate in this study.</p>
</list-item>
</list>
<p>Workers with musculoskeletal disorders due to infectious diseases, rheumatism, malignant tumors, congenital disorders and other non-occupational causes were excluded.</p>
<p>Professional staff from Shandong University School of Public Health and Jining Center for Disease Control and Prevention were responsible for subject selection. These investigators possessed backgrounds in public health and preventive medicine, along with extensive experience in questionnaire surveys. Prior to the survey commencement, investigators received systematic training on the study objectives, inclusion criteria, and data collection procedures. All eligible active-duty personnel were consecutively invited to participate. Prior to formal questionnaire distribution, all workers received a unified briefing explaining the study objectives, detailing the questionnaire completion process, and outlining relevant precautions. Participants voluntarily enrolled after receiving full informed consent and independently completed the questionnaires. To ensure data quality and procedural standardization, the questionnaire incorporated automatic logic checks and mandatory fields, with real-time monitoring of completion progress. During completion, on-site investigators addressed any participant inquiries without influencing or interfering with responses, thereby minimizing potential selection and information biases.</p>
</sec>
<sec id="sec7">
<label>2.2.3</label>
<title>Ethical considerations</title>
<p>Ethical approval was obtained independently from the School of Public Health, Shandong University (LL20231201), in accordance with the Declaration of Helsinki on the responsible and ethical conduct of human research.</p>
</sec>
</sec>
<sec id="sec8">
<label>2.3</label>
<title>Sample size</title>
<p>The minimum sample size required was 483 (based on <italic>&#x03B1;</italic>&#x202F;=&#x202F;0.05 and &#x1D6FF; = 0.03, with a further 20% non-response rate). The final sample size obtained was 1,409. This larger sample size was expected to improve the robustness and stability of the multivariable models.</p>
</sec>
<sec id="sec9">
<label>2.4</label>
<title>Instrument and data collection</title>
<sec id="sec10">
<label>2.4.1</label>
<title>Questionnaire</title>
<p>Data were collected using a validated and established, modified Chinese Musculoskeletal Questionnaire (CMQ), adapted from the Nordic Musculoskeletal Questionnaire (<xref ref-type="bibr" rid="ref15">15</xref>, <xref ref-type="bibr" rid="ref16">16</xref>). The CMQ has been previously tested for validity and reliability in various Chinese occupational groups (<xref ref-type="bibr" rid="ref3">3</xref>, <xref ref-type="bibr" rid="ref4">4</xref>).</p>
<p>The questionnaire consisted of three sections:</p>
<list list-type="alpha-lower">
<list-item>
<p>Demographic factors (gender, age, years of work experience, and marital status),</p>
</list-item>
<list-item>
<p>Self-reported musculoskeletal symptoms (body parts, frequency, intensity and duration),</p>
</list-item>
<list-item>
<p>Occupational exposure-related factors.</p>
</list-item>
</list>
</sec>
<sec id="sec11">
<label>2.4.2</label>
<title>Quality control</title>
<p>Before data collection, trained investigators provided a standardized briefing to participants, explaining the study objectives, questionnaire content, and completion procedures. The survey was conducted using a face-to-face electronic questionnaire developed on the Wenjuanxing platform, with participants completing the questionnaire independently by scanning a QR code on their mobile devices. Communication between participants was not permitted during completion, and investigators offered standardized guidance without interfering with responses. To ensure data quality, the questionnaire incorporated mandatory fields and automated logical consistency checks, and completion progress was monitored in real time. Any questions raised during the survey were addressed by trained investigators to facilitate accurate and complete data collection while minimizing information bias.</p>
</sec>
</sec>
<sec id="sec12">
<label>2.5</label>
<title>Data analysis</title>
<p>Descriptive statistics were used to summarize the basic characteristics. Continuous variables were reported as medians and interquartile ranges, while categorical variables were expressed as frequencies and percentages. Differences between groups were compared using Pearson&#x2019;s chi-square (<italic>&#x03C7;</italic><sup>2</sup>) test or Fisher&#x2019;s exact probability method, as appropriate. Multivariate logistic regression analysis was employed to identify independent risk factors for WMSD. Variables with statistically significant associations in univariate analyses (<italic>p</italic>&#x202F;&#x003C;&#x202F;0.05) were included in the regression model.</p>
</sec>
<sec id="sec13">
<label>2.6</label>
<title>Machine learning algorithm</title>
<p>Drawing on prior literature and the application of machine learning methods to occupational health risk prediction, this study employed multiple supervised learning algorithms to develop predictive models for WMSD risk among coal miners. All models were constructed after completing data preprocessing procedures, including variable encoding, standardization, and handling of missing values. Model development and analysis were conducted using the R software environment (version 4.1.2). To ensure reproducibility, a unified random seed (seed&#x202F;=&#x202F;123) was applied across all model training processes.</p>
<p>A total of six machine learning algorithms were included in this study: random forest (RF), decision tree (DT), neural network (NN), Na&#x00EF;ve Bayes (NB), support vector machine (SVM), and k-nearest neighbors (K-NN). WMSD occurrence was specified as the dependent variable, and feature variables identified by logistic regression were used as independent variables. Model outputs were expressed as individual predicted probabilities of WMSD occurrence (ranging from 0 to 1). Risk stratification was performed based on these predicted probabilities, with consistent thresholds applied across all models to define high risk (&#x003E;0.65), low risk (&#x003C;0.35), and intermediate risk categories.</p>
<sec id="sec14">
<label>2.6.1</label>
<title>Model introduction and parameter settings</title>
<sec id="sec15">
<label>2.6.1.1</label>
<title>Random forest model (RF)</title>
<p>A random forest model is a supervised learning algorithm based on ensemble learning, which reduces the risk of overfitting and improves model generalizability by constructing multiple decision trees and aggregating their prediction results. In this study, a classification model was developed using the randomForest package in R. The number of trees was set to 500 (ntree&#x202F;=&#x202F;500), and the number of variables randomly selected at each node split was set to 8 (mtry&#x202F;=&#x202F;8). This approach is well-suited for high-dimensional data, demonstrates strong robustness to noise and missing values, and provides measures of variable importance to facilitate the identification of key influencing factors.</p>
</sec>
<sec id="sec16">
<label>2.6.1.2</label>
<title>Decision tree model (DT)</title>
<p>The decision tree model constructs a tree-like structure by recursively partitioning the feature space, resulting in an intuitive and easily interpretable model. In this study, a decision tree model was developed using the rpart package in R. The complexity parameter was set to 0.01 (cp&#x202F;=&#x202F;0.01) to control tree growth, the maximum tree depth was limited to 5 (maxdepth&#x202F;=&#x202F;5), and the minimum number of samples required for a node split was set to 20 (minsplit&#x202F;=&#x202F;20). In addition, 10-fold cross-validation was applied in the rpart framework to enable automatic cost-complexity pruning, and the subtree with the minimum cross-validation error was selected to mitigate overfitting.</p>
</sec>
<sec id="sec17">
<label>2.6.1.3</label>
<title>Neural network model (NN)</title>
<p>The neural network model was used to capture nonlinear relationships among variables. In this study, a single-hidden-layer neural network was constructed using the nnet package within the caret framework in R. The number of neurons in the hidden layer was set to 8 (size&#x202F;=&#x202F;8), and L2 regularization was applied with a decay parameter of 0.1 (decay&#x202F;=&#x202F;0.1) to mitigate overfitting. The maximum number of training iterations was set to 200 (maxit&#x202F;=&#x202F;200). During model training, parallel computing was enabled to improve computational efficiency, and model convergence was monitored throughout the training process.</p>
</sec>
<sec id="sec18">
<label>2.6.1.4</label>
<title>Na&#x00EF;ve Bayes model (NB)</title>
<p>The Na&#x00EF;ve Bayes model performs probabilistic inference based on Bayes&#x2019; theorem and is well suited for high-dimensional and small-sample datasets. In this study, the NB model was constructed using the e1071 package in R, with Laplace smoothing applied (laplace&#x202F;=&#x202F;1) to address zero-probability issues. For continuous variables, kernel density estimation was used by default to preserve the underlying distributional characteristics.</p>
</sec>
<sec id="sec19">
<label>2.6.1.5</label>
<title>Support vector machine model (SVM)</title>
<p>The support vector machine (SVM) model performs classification by constructing an optimal separating hyperplane and is particularly effective for handling nonlinear relationships. In this study, the SVM model was developed using the e1071 package in R with a radial basis function kernel (kernel&#x202F;=&#x202F;&#x201C;radial&#x201D;). The regularization parameter was set to 1 (cost&#x202F;=&#x202F;1), and the kernel parameter was set to 1 (gamma&#x202F;=&#x202F;1). Probability estimation was enabled (probability&#x202F;=&#x202F;TRUE) to generate individual predicted probabilities of WMSD occurrence.</p>
</sec>
<sec id="sec20">
<label>2.6.1.6</label>
<title>K-nearest neighbors model (K-NN)</title>
<p>The k-nearest neighbors (K-NN) algorithm is an instance-based, nonparametric supervised learning method. In this study, a K-NN classification model was constructed using the caret package in R. Continuous variables were centered and scaled prior to model training to eliminate the influence of scale differences, and Euclidean distance was used as the similarity metric. The optimal number of neighbors was selected through automated tuning (tuneLength&#x202F;=&#x202F;10). Model performance and generalizability were evaluated using 10-fold cross-validation.</p>
</sec>
<sec id="sec21">
<label>2.6.1.7</label>
<title>Stacking ensemble model</title>
<p>Ensemble learning was applied to improve the predictive accuracy and generalizability of the WMSD risk model. A stacking ensemble strategy was implemented, in which six heterogeneous machine learning algorithms (neural network, random forest, decision tree, Na&#x00EF;ve Bayes, support vector machine, and k-nearest neighbors) were used as first-level base learners and trained using the caret package in R. Model training employed three-fold cross-validation combined with five bootstrap resampling iterations to reduce overfitting, with the area under the receiver operating characteristic curve (AUC) used as the primary performance metric. Predicted probabilities from the base models were used as meta-features and integrated using a generalized linear model at the second level.</p>
</sec>
</sec>
<sec id="sec22">
<label>2.6.2</label>
<title>Validation and evaluation of predictive models</title>
<p>All models were trained and evaluated using the same training and test datasets. The dataset was randomly split into a training set (70%) and a test set (30%) using a fixed random seed (seed&#x202F;=&#x202F;123). Model training and parameter optimization were performed exclusively on the training set, while the test set was used solely for validation and performance evaluation. This approach was adopted to minimize overfitting and to ensure an unbiased assessment of model performance.</p>
<p>The predictive performance of the machine learning models was evaluated on the test dataset. The primary performance metric was the area under the receiver operating characteristic curve (AUC), and additional metrics, including accuracy, precision, recall, and F1-score, were also calculated. Accuracy, precision, recall, and F1-score were derived from the binary confusion matrix. Detailed definitions of the confusion matrix and calculation formulas for each metric are provided in the <xref ref-type="supplementary-material" rid="SM1">Supplementary Table S4</xref> and <xref ref-type="supplementary-material" rid="SM1">Supplementary Equations 1&#x2013;4</xref>.</p>
<sec id="sec23">
<label>2.6.2.1</label>
<title>Accuracy</title>
<p>Accuracy refers to the proportion of correctly predicted samples out of the total number of samples. It serves as a fundamental metric for evaluating a model&#x2019;s overall performance and is suitable for datasets with balanced class distributions. However, when data exhibits class imbalance, accuracy may fail to fully reflect the model&#x2019;s actual performance.</p>
</sec>
<sec id="sec24">
<label>2.6.2.2</label>
<title>Precision</title>
<p>Accuracy refers to the proportion of samples predicted as positive cases by the model that are actually positive cases. Accuracy reflects the reliability of the model in predicting positive cases. In WMSD risk prediction, high accuracy means the model can reduce false positives, thereby lowering unnecessary intervention costs.</p>
</sec>
<sec id="sec25">
<label>2.6.2.3</label>
<title>Recall</title>
<p>Recall refers to the proportion of samples that are actually positive cases and are correctly predicted as positive by the model. Recall reflects the model&#x2019;s ability to identify positive case samples. In WMSD risk prediction, a high recall indicates that the model can identify as many high-risk workers as possible, avoiding underreporting and thereby reducing the risk of occupational disease occurrence.</p>
</sec>
<sec id="sec26">
<label>2.6.2.4</label>
<title>F1-score</title>
<p>F1 score is the harmonic mean of precision and recall, providing a balanced measure of both accuracy and sensitivity. It is particularly useful for evaluating model performance when positive and negative samples are imbalanced, offering a more comprehensive assessment. The F1 score is a synthetic metric that reflects the overall effectiveness of a model more accurately than precision or recall alone, especially when dealing with imbalanced data. It ranges from 0 to 1, with higher values indicating better performance in both precision and recall.</p>
</sec>
<sec id="sec27">
<label>2.6.2.5</label>
<title>Receiver operating characteristic curve and AUC</title>
<p>The ROC curve is a graph plotting the false positive rate (FPR) on the <italic>x</italic>-axis and the true positive rate (TPR) on the <italic>y</italic>-axis, illustrating the relationship between true positive and false positive rates. AUC refers to the Area Under the Receiver Operating Characteristic curve, i.e., the area beneath the ROC curve, with values ranging from 0 to 1. An AUC value of 0.5 indicates that the model&#x2019;s predictive capability is equivalent to random guessing, signifying poor predictive ability and no practical application value. An AUC value between 0.5 and 0.7 indicates average predictive performance; an AUC value &#x003E; 0.7 signifies good predictive performance with high practical value. AUC reflects the model&#x2019;s overall performance across different classification thresholds. The closer the AUC value is to 1, the stronger the model&#x2019;s classification capability.</p>
</sec>
</sec>
</sec>
</sec>
<sec sec-type="results" id="sec28">
<label>3</label>
<title>Results</title>
<sec id="sec29">
<label>3.1</label>
<title>Participant demographics</title>
<p>Of the 1,409 participants, 1,308 (92.8%) were male. The predominant age group was 30&#x2013;40&#x202F;years old (<italic>n</italic>&#x202F;=&#x202F;965, 58%). Most participants (<italic>n</italic>&#x202F;=&#x202F;783, 55.6%) had a normal BMI (18.5 to 25&#x202F;kg/m<sup>2</sup>), while 539 (38.2%) were classified as overweight (25&#x202F;kg/m<sup>2</sup> &#x2264;&#x202F;BMI&#x202F;&#x003C;&#x202F;30&#x202F;kg/m<sup>2</sup>) and 67 (4.8%) were classified as obesity (BMI&#x202F;&#x2265;&#x202F;30&#x202F;kg/m<sup>2</sup>). In terms of educational attainment, 808 (48.6%) of the participants had completed high school, 440 (26.4%) had completed junior college, and only 294 (17.7%) held a bachelor&#x2019;s degree. The majority had 10&#x2013;20&#x202F;years of work experience (<italic>n</italic>&#x202F;=&#x202F;877, 62.2%), followed by those with &#x003E;20&#x202F;years of service (<italic>n</italic>&#x202F;=&#x202F;314, 22.4%). Nearly half of the participants reported occasional physical activity (<italic>n</italic>&#x202F;=&#x202F;668, 47.4%), while 615 (43.6%) reported no regular exercise. Additional demographic characteristics are presented in <xref ref-type="table" rid="tab1">Table 1</xref>.</p>
<table-wrap position="float" id="tab1">
<label>Table 1</label>
<caption>
<p>Demographic characteristics of the participants.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top" colspan="2">Variables categories</th>
<th align="center" valign="top">
<italic>N</italic>
</th>
<th align="center" valign="top">Percentage (%)</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top" rowspan="2">Gender</td>
<td align="left" valign="top">Male</td>
<td align="center" valign="top">1,308</td>
<td align="center" valign="top">92.8</td>
</tr>
<tr>
<td align="left" valign="middle">Female</td>
<td align="center" valign="middle">101</td>
<td align="center" valign="middle">7.2</td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="4">Age (years)</td>
<td align="left" valign="middle">20&#x202F;~&#x202F;30</td>
<td align="center" valign="middle">93</td>
<td align="center" valign="middle">6.6</td>
</tr>
<tr>
<td align="left" valign="middle">30&#x202F;~&#x202F;40</td>
<td align="center" valign="middle">812</td>
<td align="center" valign="middle">57.6</td>
</tr>
<tr>
<td align="left" valign="middle">40&#x202F;~&#x202F;50</td>
<td align="center" valign="middle">425</td>
<td align="center" valign="middle">30.2</td>
</tr>
<tr>
<td align="left" valign="middle">&#x003E;50</td>
<td align="center" valign="middle">79</td>
<td align="center" valign="middle">5.6</td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="4">Body Mass Index (kg/m<sup>2</sup>)</td>
<td align="left" valign="middle">&#x003C;18.5</td>
<td align="center" valign="middle">20</td>
<td align="center" valign="middle">1.4</td>
</tr>
<tr>
<td align="left" valign="middle">18.5&#x202F;~&#x202F;25</td>
<td align="center" valign="middle">783</td>
<td align="center" valign="middle">55.6</td>
</tr>
<tr>
<td align="left" valign="middle">25&#x202F;~&#x202F;30</td>
<td align="center" valign="middle">539</td>
<td align="center" valign="middle">38.2</td>
</tr>
<tr>
<td align="left" valign="middle">&#x2265;30</td>
<td align="center" valign="middle">67</td>
<td align="center" valign="middle">4.8</td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="2">Hand</td>
<td align="left" valign="middle">Right</td>
<td align="center" valign="middle">1,266</td>
<td align="center" valign="middle">89.9</td>
</tr>
<tr>
<td align="left" valign="middle">Left</td>
<td align="center" valign="middle">143</td>
<td align="center" valign="middle">10.1</td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="5">Education</td>
<td align="left" valign="middle">Junior high school and below</td>
<td align="center" valign="middle">104</td>
<td align="center" valign="middle">7.4</td>
</tr>
<tr>
<td align="left" valign="middle">High school</td>
<td align="center" valign="middle">736</td>
<td align="center" valign="middle">52.2</td>
</tr>
<tr>
<td align="left" valign="middle">Junior college</td>
<td align="center" valign="middle">363</td>
<td align="center" valign="middle">25.8</td>
</tr>
<tr>
<td align="left" valign="middle">Bachelor degree</td>
<td align="center" valign="middle">202</td>
<td align="center" valign="middle">14.3</td>
</tr>
<tr>
<td align="left" valign="middle">Master degree or above</td>
<td align="center" valign="middle">4</td>
<td align="center" valign="middle">0.3</td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="3">Marital status</td>
<td align="left" valign="middle">Unmarried</td>
<td align="center" valign="middle">66</td>
<td align="center" valign="middle">4.7</td>
</tr>
<tr>
<td align="left" valign="middle">Married and living with spouse</td>
<td align="center" valign="middle">1,311</td>
<td align="center" valign="middle">93</td>
</tr>
<tr>
<td align="left" valign="middle">Married but separated</td>
<td align="center" valign="middle">32</td>
<td align="center" valign="middle">2.3</td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="4">Monthly income (RMB&#x002A;)</td>
<td align="left" valign="middle">&#x2264;3,000</td>
<td align="center" valign="middle">50</td>
<td align="center" valign="middle">3.5</td>
</tr>
<tr>
<td align="left" valign="middle">3,001&#x2013;5,000</td>
<td align="center" valign="middle">422</td>
<td align="center" valign="middle">30</td>
</tr>
<tr>
<td align="left" valign="middle">5,001&#x2013;10,000</td>
<td align="center" valign="middle">773</td>
<td align="center" valign="middle">54.9</td>
</tr>
<tr>
<td align="left" valign="middle">&#x003E;10,000</td>
<td align="center" valign="middle">164</td>
<td align="center" valign="middle">11.6</td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="5">Physical exercise</td>
<td align="left" valign="middle">No</td>
<td align="center" valign="middle">615</td>
<td align="center" valign="middle">43.6</td>
</tr>
<tr>
<td align="left" valign="middle">Occasionally</td>
<td align="center" valign="middle">668</td>
<td align="center" valign="middle">47.4</td>
</tr>
<tr>
<td align="left" valign="middle">2&#x202F;~&#x202F;3 times/month</td>
<td align="center" valign="middle">27</td>
<td align="center" valign="middle">1.9</td>
</tr>
<tr>
<td align="left" valign="middle">1&#x202F;~&#x202F;2 times/week</td>
<td align="center" valign="middle">50</td>
<td align="center" valign="middle">3.5</td>
</tr>
<tr>
<td align="left" valign="middle">&#x003E;2 times/week</td>
<td align="center" valign="middle">49</td>
<td align="center" valign="middle">3.5</td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="4">Smoking behavior</td>
<td align="left" valign="middle">Non-smoker</td>
<td align="center" valign="middle">571</td>
<td align="center" valign="middle">40.5</td>
</tr>
<tr>
<td align="left" valign="middle">Occasional smoking</td>
<td align="center" valign="middle">361</td>
<td align="center" valign="middle">25.6</td>
</tr>
<tr>
<td align="left" valign="middle">Regular smoking</td>
<td align="center" valign="middle">433</td>
<td align="center" valign="middle">30.7</td>
</tr>
<tr>
<td align="left" valign="middle">Quit smoking</td>
<td align="center" valign="middle">44</td>
<td align="center" valign="middle">3.1</td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="4">Length of service in this job category</td>
<td align="left" valign="middle">&#x003C;5</td>
<td align="center" valign="middle">415</td>
<td align="center" valign="middle">29.5</td>
</tr>
<tr>
<td align="left" valign="middle">5&#x202F;~&#x202F;10</td>
<td align="center" valign="middle">318</td>
<td align="center" valign="middle">22.6</td>
</tr>
<tr>
<td align="left" valign="middle">10&#x202F;~&#x202F;15</td>
<td align="center" valign="middle">351</td>
<td align="center" valign="middle">24.9</td>
</tr>
<tr>
<td align="left" valign="middle">&#x003E;15</td>
<td align="center" valign="middle">325</td>
<td align="center" valign="middle">23.1</td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="3">Length of employment</td>
<td align="left" valign="middle">&#x2264;10</td>
<td align="center" valign="middle">218</td>
<td align="center" valign="middle">15.5</td>
</tr>
<tr>
<td align="left" valign="middle">10&#x202F;~&#x202F;20</td>
<td align="center" valign="middle">877</td>
<td align="center" valign="middle">62.2</td>
</tr>
<tr>
<td align="left" valign="middle">&#x003E;20</td>
<td align="center" valign="middle">314</td>
<td align="center" valign="middle">22.3</td>
</tr>
<tr>
<td align="left" valign="middle" colspan="2">Total</td>
<td align="center" valign="middle">1,409</td>
<td align="center" valign="middle">100</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p>&#x002A;RMB in table refers to Renminbi, the official legal currency of China.</p>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="sec30">
<label>3.2</label>
<title>Prevalence of WMSD</title>
<p>In total, 1,156 (82%) participants reported experiencing work-related musculoskeletal pain or discomfort in the past 12&#x202F;months. Multisite (2 or more) WMSD were more prevalent (86.3%) than single-site (13.7%). The most commonly affected areas were the neck (59.5%), shoulder (53.4%) and low back (46.5%) (<xref ref-type="table" rid="tab2">Table 2</xref>).</p>
<table-wrap position="float" id="tab2">
<label>Table 2</label>
<caption>
<p>Prevalence of WMSD by body region.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Body parts</th>
<th align="center" valign="top">Positive case (n)</th>
<th align="center" valign="top">Prevalence (%)</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle">Neck</td>
<td align="center" valign="middle">839</td>
<td align="center" valign="middle">59.5</td>
</tr>
<tr>
<td align="left" valign="middle">Shoulder</td>
<td align="center" valign="middle">752</td>
<td align="center" valign="middle">53.4</td>
</tr>
<tr>
<td align="left" valign="middle">Upper back</td>
<td align="center" valign="middle">377</td>
<td align="center" valign="middle">26.8</td>
</tr>
<tr>
<td align="left" valign="middle">Low back</td>
<td align="center" valign="middle">655</td>
<td align="center" valign="middle">46.5</td>
</tr>
<tr>
<td align="left" valign="middle">Elbow</td>
<td align="center" valign="middle">571</td>
<td align="center" valign="middle">40.5</td>
</tr>
<tr>
<td align="left" valign="middle">Wrist/hand</td>
<td align="center" valign="middle">620</td>
<td align="center" valign="middle">44</td>
</tr>
<tr>
<td align="left" valign="middle">Hip/Thigh</td>
<td align="center" valign="middle">484</td>
<td align="center" valign="middle">34.4</td>
</tr>
<tr>
<td align="left" valign="middle">Knee</td>
<td align="center" valign="middle">598</td>
<td align="center" valign="middle">42.4</td>
</tr>
<tr>
<td align="left" valign="middle">Ankle/foot</td>
<td align="center" valign="middle">485</td>
<td align="center" valign="middle">34.4</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="sec31">
<label>3.3</label>
<title>Occupational risk factor</title>
<sec id="sec32">
<label>3.3.1</label>
<title>Univariate analysis</title>
<p>Univariate analyses were performed using Pearson&#x2019;s <italic>&#x03C7;</italic><sup>2</sup> test and the <italic>&#x03C7;</italic><sup>2</sup> test for trend on 9 demographic variables and 49 work-related variables to identify variables associated with work-related musculoskeletal disorders (WMSDs). The results for demographic characteristics are summarized in <xref ref-type="table" rid="tab3">Table 3</xref>, and the complete univariate analysis results are presented in <xref ref-type="supplementary-material" rid="SM1">Supplementary Table S1</xref>. The <italic>&#x03C7;</italic><sup>2</sup> test results indicated that, among individual-level factors, employment length was significantly associated with WMSD prevalence, with the risk increasing as years of employment increased. Married workers exhibited a higher prevalence of WMSDs than unmarried workers. In addition, workers who regularly engaged in physical activity had a lower prevalence of WMSDs compared with those who did not or only rarely participated in physical activity. Regular smokers showed a higher prevalence of WMSDs than non-smokers, occasional smokers, and former smokers. In contrast, sex, age, body mass index (BMI), educational level, and monthly income were not significantly associated with WMSD occurrence.</p>
<table-wrap position="float" id="tab3">
<label>Table 3</label>
<caption>
<p>Comparison of WMSD with different demographic characteristics.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Factors</th>
<th align="center" valign="top">
<italic>N</italic>
</th>
<th align="center" valign="top">Positive case (n)</th>
<th align="center" valign="top">Prevalence (%)</th>
<th align="center" valign="top">
<italic>&#x03C7;</italic>
<sup>2</sup>
</th>
<th align="center" valign="top">
<italic>P</italic>
</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle" colspan="6">Length of service in this job category</td>
</tr>
<tr>
<td align="left" valign="middle">&#x003C;5</td>
<td align="center" valign="middle">415</td>
<td align="center" valign="middle">325</td>
<td align="center" valign="middle">78.3</td>
<td align="char" valign="middle" char=".">10.793</td>
<td align="char" valign="middle" char=".">0.013</td>
</tr>
<tr>
<td align="left" valign="middle">5&#x202F;~&#x202F;10</td>
<td align="center" valign="middle">318</td>
<td align="center" valign="middle">253</td>
<td align="center" valign="middle">79.6</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle">10&#x202F;~&#x202F;15</td>
<td align="center" valign="middle">351</td>
<td align="center" valign="middle">299</td>
<td align="center" valign="middle">85.2</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle">&#x003E;15</td>
<td align="center" valign="middle">325</td>
<td align="center" valign="middle">279</td>
<td align="center" valign="middle">85.8</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle" colspan="6">Length of employment</td>
</tr>
<tr>
<td align="left" valign="middle">&#x2264;10</td>
<td align="center" valign="middle">218</td>
<td align="center" valign="middle">152</td>
<td align="center" valign="middle">69.7</td>
<td align="char" valign="middle" char=".">28.592</td>
<td align="char" valign="middle" char=".">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">10&#x202F;~&#x202F;20</td>
<td align="center" valign="middle">877</td>
<td align="center" valign="middle">731</td>
<td align="center" valign="middle">83.4</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle">&#x003E;20</td>
<td align="center" valign="middle">314</td>
<td align="center" valign="middle">273</td>
<td align="center" valign="middle">86.9</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle" colspan="6">Marital status</td>
</tr>
<tr>
<td align="left" valign="middle">Unmarried</td>
<td align="center" valign="middle">66</td>
<td align="center" valign="middle">43</td>
<td align="center" valign="middle">62.5</td>
<td align="char" valign="middle" char=".">13.471</td>
<td align="char" valign="middle" char=".">0.001</td>
</tr>
<tr>
<td align="left" valign="middle">Married and living with spouse</td>
<td align="center" valign="middle">1,311</td>
<td align="center" valign="middle">1,087</td>
<td align="center" valign="middle">82.9</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Married but separated</td>
<td align="center" valign="middle">32</td>
<td align="center" valign="middle">26</td>
<td align="center" valign="middle">81.25</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle" colspan="6">Physical exercise</td>
</tr>
<tr>
<td align="left" valign="middle">No</td>
<td align="center" valign="middle">615</td>
<td align="center" valign="middle">534</td>
<td align="center" valign="middle">86.8</td>
<td align="char" valign="middle" char=".">20.812</td>
<td align="char" valign="middle" char=".">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">Occasionally</td>
<td align="center" valign="middle">668</td>
<td align="center" valign="middle">527</td>
<td align="center" valign="middle">78.9</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle">2&#x202F;~&#x202F;3times/month</td>
<td align="center" valign="middle">27</td>
<td align="center" valign="middle">23</td>
<td align="center" valign="middle">85.2</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle">1&#x202F;~&#x202F;2times/week</td>
<td align="center" valign="middle">50</td>
<td align="center" valign="middle">38</td>
<td align="center" valign="middle">76</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle">&#x003E; 2 times/week</td>
<td align="center" valign="middle">49</td>
<td align="center" valign="middle">34</td>
<td align="center" valign="middle">69.4</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle" colspan="6">Smoking behavior</td>
</tr>
<tr>
<td align="left" valign="middle">Non-smoker</td>
<td align="center" valign="middle">571</td>
<td align="center" valign="middle">455</td>
<td align="center" valign="middle">79.7</td>
<td align="char" valign="middle" char=".">14.111</td>
<td align="char" valign="middle" char=".">0.003</td>
</tr>
<tr>
<td align="left" valign="middle">Occasional</td>
<td align="center" valign="middle">361</td>
<td align="center" valign="middle">285</td>
<td align="center" valign="middle">78.9</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Regular</td>
<td align="center" valign="middle">433</td>
<td align="center" valign="middle">380</td>
<td align="center" valign="middle">87.8</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Quit smoking</td>
<td align="center" valign="middle">44</td>
<td align="center" valign="middle">36</td>
<td align="center" valign="middle">81.8</td>
<td/>
<td/>
</tr>
</tbody>
</table>
</table-wrap>
<p>In addition, the occurrence of WMSDs was significantly associated with multiple work-related factors, including perceived health status, prolonged standing, prolonged kneeling, prolonged trunk bending, prolonged neck flexion, prolonged knee bending, high-frequency repetitive operations per minute, frequent repetition of the same back movements, repetitive wrist flexion/extension, uncomfortable working postures, repetitive operations performed multiple times per minute, carrying heavy loads (more than 20&#x202F;kg per lift), operating with hands or arms, overtime work, feeling cold at work, exposure to wind or temperature changes in the working environment, and insufficient rest time. For example, workers who frequently stood for long periods during work had a markedly higher prevalence of WMSDs than those in other work categories, whereas workers who rarely or never stood for prolonged periods had a lower prevalence of WMSDs. To improve clarity and conciseness, <xref ref-type="table" rid="tab4">Table 4</xref> presents only variables with <italic>p</italic> values less than 0.001 in the univariate analyses. The complete results of the <italic>&#x03C7;</italic><sup>2</sup> tests for all work-related variables are provided in <xref ref-type="supplementary-material" rid="SM1">Supplementary Table S2</xref>.</p>
<table-wrap position="float" id="tab4">
<label>Table 4</label>
<caption>
<p>Comparison of WMSD with different work-related factors.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Factors</th>
<th align="center" valign="top">
<italic>N</italic>
</th>
<th align="center" valign="top">Positive case</th>
<th align="center" valign="top">Prevalence (%)</th>
<th align="center" valign="top">
<italic>&#x03C7;</italic>
<sup>2</sup>
</th>
<th align="center" valign="top">
<italic>P</italic>
</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle" colspan="6">Perceived health status</td>
</tr>
<tr>
<td align="left" valign="middle">Perfect</td>
<td align="center" valign="middle">462</td>
<td align="center" valign="middle">308</td>
<td align="center" valign="middle">66.7</td>
<td align="char" valign="middle" char=".">111.438</td>
<td align="char" valign="middle" char=".">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">Fine</td>
<td align="center" valign="middle">832</td>
<td align="center" valign="middle">741</td>
<td align="center" valign="middle">89.2</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Poor</td>
<td align="center" valign="middle">103</td>
<td align="center" valign="middle">96</td>
<td align="center" valign="middle">93.2</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Very poor</td>
<td align="center" valign="middle">12</td>
<td align="center" valign="middle">11</td>
<td align="center" valign="middle">91.7</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle" colspan="6">Keep standing for long hours</td>
</tr>
<tr>
<td align="left" valign="middle">Never</td>
<td align="center" valign="middle">236</td>
<td align="center" valign="middle">181</td>
<td align="center" valign="middle">76.7</td>
<td align="char" valign="middle" char=".">38.375</td>
<td align="char" valign="middle" char=".">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">Occasionally</td>
<td align="center" valign="middle">253</td>
<td align="center" valign="middle">185</td>
<td align="center" valign="middle">73.1</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Frequently</td>
<td align="center" valign="middle">362</td>
<td align="center" valign="middle">292</td>
<td align="center" valign="middle">80.7</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Very Frequently</td>
<td align="center" valign="middle">558</td>
<td align="center" valign="middle">498</td>
<td align="center" valign="middle">89.2</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle">No</td>
<td align="center" valign="middle">743</td>
<td align="center" valign="middle">577</td>
<td align="center" valign="middle">77.7</td>
<td align="char" valign="middle" char=".">20.525</td>
<td align="char" valign="middle" char=".">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">Yes</td>
<td align="center" valign="middle">666</td>
<td align="center" valign="middle">579</td>
<td align="center" valign="middle">86.9</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle" colspan="6">Keep bowing the head for long hours</td>
</tr>
<tr>
<td align="left" valign="middle">No</td>
<td align="center" valign="middle">786</td>
<td align="center" valign="middle">603</td>
<td align="center" valign="middle">76.7</td>
<td align="char" valign="middle" char=".">34.235</td>
<td align="char" valign="middle" char=".">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">Yes</td>
<td align="center" valign="middle">623</td>
<td align="center" valign="middle">553</td>
<td align="center" valign="middle">88.8</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle" colspan="6">Keep bending knees for long hours</td>
</tr>
<tr>
<td align="left" valign="middle">No</td>
<td align="center" valign="middle">751</td>
<td align="center" valign="middle">582</td>
<td align="center" valign="middle">77.5</td>
<td align="char" valign="middle" char=".">22.573</td>
<td align="char" valign="middle" char=".">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">Yes</td>
<td align="center" valign="middle">658</td>
<td align="center" valign="middle">574</td>
<td align="center" valign="middle">87.2</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle" colspan="6">Repeat operation many times a working minute</td>
</tr>
<tr>
<td align="left" valign="middle">No</td>
<td align="center" valign="middle">594</td>
<td align="center" valign="middle">438</td>
<td align="center" valign="middle">73.7</td>
<td align="char" valign="middle" char=".">48.099</td>
<td align="char" valign="middle" char=".">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">Yes</td>
<td align="center" valign="middle">815</td>
<td align="center" valign="middle">718</td>
<td align="center" valign="middle">88.1</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle" colspan="6">Frequent repetition of the same movement on the back</td>
</tr>
<tr>
<td align="left" valign="middle">No</td>
<td align="center" valign="middle">459</td>
<td align="center" valign="middle">340</td>
<td align="center" valign="middle">74.1</td>
<td align="char" valign="middle" char=".">29.353</td>
<td align="char" valign="middle" char=".">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">Yes</td>
<td align="center" valign="middle">950</td>
<td align="center" valign="middle">816</td>
<td align="center" valign="middle">85.9</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle" colspan="6">Bending wrist up/down</td>
</tr>
<tr>
<td align="left" valign="middle">No</td>
<td align="center" valign="middle">403</td>
<td align="center" valign="middle">292</td>
<td align="center" valign="middle">72.5</td>
<td align="char" valign="middle" char=".">35.218</td>
<td align="char" valign="middle" char=".">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">Yes</td>
<td align="center" valign="middle">1,006</td>
<td align="center" valign="middle">864</td>
<td align="center" valign="middle">85.9</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle" colspan="6">Work in uncomfortable postures</td>
</tr>
<tr>
<td align="left" valign="middle">Never</td>
<td align="center" valign="middle">359</td>
<td align="center" valign="middle">251</td>
<td align="center" valign="middle">69.9</td>
<td align="char" valign="middle" char=".">65.717</td>
<td align="char" valign="middle" char=".">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">Occasionally</td>
<td align="center" valign="middle">528</td>
<td align="center" valign="middle">429</td>
<td align="center" valign="middle">81.3</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Frequently</td>
<td align="center" valign="middle">333</td>
<td align="center" valign="middle">303</td>
<td align="center" valign="middle">91</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Very Frequently</td>
<td align="center" valign="middle">189</td>
<td align="center" valign="middle">173</td>
<td align="center" valign="middle">91.5</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle" colspan="6">Operate repetitively for multiple times per minute</td>
</tr>
<tr>
<td align="left" valign="middle">Never</td>
<td align="center" valign="middle">281</td>
<td align="center" valign="middle">203</td>
<td align="center" valign="middle">72.2</td>
<td align="char" valign="middle" char=".">56.769</td>
<td align="char" valign="middle" char=".">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">Occasionally</td>
<td align="center" valign="middle">429</td>
<td align="center" valign="middle">327</td>
<td align="center" valign="middle">76.2</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Frequently</td>
<td align="center" valign="middle">395</td>
<td align="center" valign="middle">347</td>
<td align="center" valign="middle">87.8</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Very Frequently</td>
<td align="center" valign="middle">304</td>
<td align="center" valign="middle">279</td>
<td align="center" valign="middle">91.8</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle" colspan="6">Carry heavy objects (more than 20&#x202F;kg each time)</td>
</tr>
<tr>
<td align="left" valign="middle">Never</td>
<td align="center" valign="middle">355</td>
<td align="center" valign="middle">262</td>
<td align="center" valign="middle">73.8</td>
<td align="char" valign="middle" char=".">34.335</td>
<td align="char" valign="middle" char=".">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">Occasionally</td>
<td align="center" valign="middle">433</td>
<td align="center" valign="middle">346</td>
<td align="center" valign="middle">79.9</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Frequently</td>
<td align="center" valign="middle">331</td>
<td align="center" valign="middle">289</td>
<td align="center" valign="middle">87.3</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Very Frequently</td>
<td align="center" valign="middle">290</td>
<td align="center" valign="middle">259</td>
<td align="center" valign="middle">89.3</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle" colspan="6">Operate with hands or arms</td>
</tr>
<tr>
<td align="left" valign="middle">Never</td>
<td align="center" valign="middle">224</td>
<td align="center" valign="middle">166</td>
<td align="center" valign="middle">74.1</td>
<td align="char" valign="middle" char=".">46.305</td>
<td align="char" valign="middle" char=".">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">Occasionally</td>
<td align="center" valign="middle">289</td>
<td align="center" valign="middle">210</td>
<td align="center" valign="middle">72.7</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Frequently</td>
<td align="center" valign="middle">419</td>
<td align="center" valign="middle">353</td>
<td align="center" valign="middle">84.2</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Very Frequently</td>
<td align="center" valign="middle">477</td>
<td align="center" valign="middle">427</td>
<td align="center" valign="middle">89.5</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle" colspan="6">Overtime work</td>
</tr>
<tr>
<td align="left" valign="middle">No</td>
<td align="center" valign="middle">725</td>
<td align="center" valign="middle">549</td>
<td align="center" valign="middle">75.7</td>
<td align="char" valign="middle" char=".">40.49</td>
<td align="char" valign="middle" char=".">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">Yes</td>
<td align="center" valign="middle">684</td>
<td align="center" valign="middle">607</td>
<td align="center" valign="middle">88.7</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle" colspan="6">Feeling cold, wind or temperature change at work</td>
</tr>
<tr>
<td align="left" valign="middle">No</td>
<td align="center" valign="middle">283</td>
<td align="center" valign="middle">192</td>
<td align="center" valign="middle">67.8</td>
<td align="char" valign="middle" char=".">48.467</td>
<td align="char" valign="middle" char=".">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">Yes</td>
<td align="center" valign="middle">1,126</td>
<td align="center" valign="middle">964</td>
<td align="center" valign="top">85.6</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="top" colspan="6">Enough rest time</td>
</tr>
<tr>
<td align="left" valign="top">No</td>
<td align="center" valign="top">939</td>
<td align="center" valign="top">832</td>
<td align="center" valign="top">88.6</td>
<td align="char" valign="top" char=".">82.252</td>
<td align="char" valign="top" char=".">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="top">Yes</td>
<td align="center" valign="top">470</td>
<td align="center" valign="top">324</td>
<td align="center" valign="top">68.9</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="top" colspan="6">Back position</td>
</tr>
<tr>
<td align="left" valign="top">Upright</td>
<td align="center" valign="top">492</td>
<td align="center" valign="top">372</td>
<td align="center" valign="top">75.6</td>
<td align="char" valign="top" char=".">22.52</td>
<td align="char" valign="top" char=".">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="top">Slightly curved</td>
<td align="center" valign="top">591</td>
<td align="center" valign="top">499</td>
<td align="center" valign="top">75.6</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="top">Substantial bending</td>
<td align="center" valign="top">326</td>
<td align="center" valign="top">285</td>
<td align="center" valign="top">87.4</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="top" colspan="6">Neck position</td>
</tr>
<tr>
<td align="left" valign="top">Upright</td>
<td align="center" valign="top">460</td>
<td align="center" valign="top">339</td>
<td align="center" valign="top">73.7</td>
<td align="char" valign="top" char=".">35.701</td>
<td align="char" valign="top" char=".">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="top">Slightly forward leaning</td>
<td align="center" valign="top">601</td>
<td align="center" valign="top">507</td>
<td align="center" valign="top">84.4</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="top">Large forward lean</td>
<td align="center" valign="top">272</td>
<td align="center" valign="top">243</td>
<td align="center" valign="top">89.3</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="top">Head tilted back</td>
<td align="center" valign="top">76</td>
<td align="center" valign="top">67</td>
<td align="center" valign="top">88.2</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="top" colspan="6">Keep the neck in the same position for long hours</td>
</tr>
<tr>
<td align="left" valign="top">No</td>
<td align="center" valign="top">613</td>
<td align="center" valign="top">475</td>
<td align="center" valign="top">77.5</td>
<td align="char" valign="top" char=".">15.29</td>
<td align="char" valign="top" char=".">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="top">Yes</td>
<td align="center" valign="top">796</td>
<td align="center" valign="top">681</td>
<td align="center" valign="top">85.6</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="top" colspan="6">Keep turning the head for long hours</td>
</tr>
<tr>
<td align="left" valign="top">No</td>
<td align="center" valign="top">889</td>
<td align="center" valign="top">702</td>
<td align="center" valign="top">79</td>
<td align="char" valign="top" char=".">15.5</td>
<td align="char" valign="top" char=".">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="top">Yes</td>
<td align="center" valign="top">520</td>
<td align="center" valign="top">454</td>
<td align="center" valign="top">87.3</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="top" colspan="6">Keep wrist flexion for long hours</td>
</tr>
<tr>
<td align="left" valign="top">No</td>
<td align="center" valign="top">623</td>
<td align="center" valign="top">471</td>
<td align="center" valign="top">75.6</td>
<td align="char" valign="top" char=".">31.461</td>
<td align="char" valign="top" char=".">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="top">Yes</td>
<td align="center" valign="top">786</td>
<td align="center" valign="top">685</td>
<td align="center" valign="top">87.2</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="top">No</td>
<td align="center" valign="top">495</td>
<td align="center" valign="top">377</td>
<td align="center" valign="top">76.2</td>
<td align="char" valign="top" char=".">17.923</td>
<td align="char" valign="top" char=".">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="top">Yes</td>
<td align="center" valign="top">914</td>
<td align="center" valign="top">779</td>
<td align="center" valign="top">85.2</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="top" colspan="6">Lower extremities do the same movement frequently</td>
</tr>
<tr>
<td align="left" valign="top">No</td>
<td align="center" valign="top">610</td>
<td align="center" valign="top">465</td>
<td align="center" valign="top">76.2</td>
<td align="char" valign="top" char=".">24.687</td>
<td align="char" valign="top" char=".">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="top">Yes</td>
<td align="center" valign="top">799</td>
<td align="center" valign="top">691</td>
<td align="center" valign="top">86.5</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="top" colspan="6">Turn around often</td>
</tr>
<tr>
<td align="left" valign="top">No</td>
<td align="center" valign="top">358</td>
<td align="center" valign="top">270</td>
<td align="center" valign="top">75.4</td>
<td align="char" valign="top" char=".">14.299</td>
<td align="char" valign="top" char=".">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="top">Yes</td>
<td align="center" valign="top">1,051</td>
<td align="center" valign="top">886</td>
<td align="center" valign="top">84.3</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="top" colspan="6">Carry heavy objects (more than 5&#x202F;kg each time)</td>
</tr>
<tr>
<td align="left" valign="top">Never</td>
<td align="center" valign="top">297</td>
<td align="center" valign="top">228</td>
<td align="center" valign="top">76.8</td>
<td align="char" valign="top" char=".">31.076</td>
<td align="char" valign="top" char=".">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="top">Occasionally</td>
<td align="center" valign="top">376</td>
<td align="center" valign="top">288</td>
<td align="center" valign="top">76.6</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="top">Frequently</td>
<td align="center" valign="top">356</td>
<td align="center" valign="top">297</td>
<td align="center" valign="top">83.4</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="top">Very frequently</td>
<td align="center" valign="top">380</td>
<td align="center" valign="top">343</td>
<td align="center" valign="top">90.3</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="top" colspan="6">Holding onto something in hand</td>
</tr>
<tr>
<td align="left" valign="top">No</td>
<td align="center" valign="top">266</td>
<td align="center" valign="top">189</td>
<td align="center" valign="top">71.1</td>
<td align="char" valign="top" char=".">26.89</td>
<td align="char" valign="top" char=".">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="top">Yes</td>
<td align="center" valign="top">1,143</td>
<td align="center" valign="top">967</td>
<td align="center" valign="top">84.6</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="top" colspan="6">Shortage of staff in the sector</td>
</tr>
<tr>
<td align="left" valign="top">No</td>
<td align="center" valign="top">429</td>
<td align="center" valign="top">302</td>
<td align="center" valign="top">70.4</td>
<td align="char" valign="top" char=".">56.803</td>
<td align="char" valign="top" char=".">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="top">Yes</td>
<td align="center" valign="top">980</td>
<td align="center" valign="top">854</td>
<td align="center" valign="top">87.1</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="top" colspan="6">Work for someone else</td>
</tr>
<tr>
<td align="left" valign="top">No</td>
<td align="center" valign="top">972</td>
<td align="center" valign="top">774</td>
<td align="center" valign="top">79.6</td>
<td align="char" valign="top" char=".">12.401</td>
<td align="char" valign="top" char=".">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="top">Yes</td>
<td align="center" valign="top">437</td>
<td align="center" valign="top">382</td>
<td align="center" valign="top">87.4</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="top" colspan="6">Use vibrator at work</td>
</tr>
<tr>
<td align="left" valign="top">Never</td>
<td align="center" valign="top">456</td>
<td align="center" valign="top">350</td>
<td align="center" valign="top">76.8</td>
<td align="char" valign="top" char=".">26.438</td>
<td align="char" valign="top" char=".">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="top">Occasionally</td>
<td align="center" valign="top">425</td>
<td align="center" valign="top">338</td>
<td align="center" valign="top">79.5</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="top">Frequently</td>
<td align="center" valign="top">279</td>
<td align="center" valign="top">250</td>
<td align="center" valign="top">89.6</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="top">Very Frequently</td>
<td align="center" valign="top">249</td>
<td align="center" valign="top">218</td>
<td align="center" valign="top">87.6</td>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="top" colspan="6">Wrist on the edge of hard, angular objects</td>
</tr>
<tr>
<td align="left" valign="top">No</td>
<td align="center" valign="top">728</td>
<td align="center" valign="top">567</td>
<td align="center" valign="top">77.9</td>
<td align="char" valign="top" char=".">17.689</td>
<td align="char" valign="top" char=".">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="top">Yes</td>
<td align="center" valign="top">681</td>
<td align="center" valign="top">589</td>
<td align="center" valign="top">86.5</td>
<td/>
<td/>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="sec33">
<label>3.3.2</label>
<title>Multivariate logistic regression screening for influential factors</title>
<p>Eight variables were identified as independent predictors of WMSDs. Seven determinants were associated with WSMD:</p>
<list list-type="bullet">
<list-item>
<p>Smoking (OR&#x202F;=&#x202F;1.583; 95% CI: 1.039&#x2013;2.412)</p>
</list-item>
<list-item>
<p>Frequent multiple repetitive operations (OR&#x202F;=&#x202F;1.672; 95% CI: 1.161&#x2013;2.410)</p>
</list-item>
<list-item>
<p>Prolonged head-down posture (OR&#x202F;=&#x202F;1.639; 95% CI: 1.039&#x2013;2.584)</p>
</list-item>
<list-item>
<p>Uncomfortable working postures (OR&#x202F;=&#x202F;1.912; 95% CI: 1.184&#x2013;3.088)</p>
</list-item>
<list-item>
<p>Prolonged knee bending (OR&#x202F;=&#x202F;1.531; 95% CI: 1.002&#x2013;2.339)</p>
</list-item>
<list-item>
<p>Employed &#x003E;20&#x202F;years (OR&#x202F;=&#x202F;2.364; 95% CI: 1.300&#x2013;4.300)</p>
</list-item>
<list-item>
<p>Self-perceived poor health status (OR&#x202F;=&#x202F;4.034; 95% CI: 1.680&#x2013;9.688)</p>
</list-item>
</list>
<p>Having sufficient rest time appeared to be a protective factor against WMSD (OR&#x202F;=&#x202F;0.518; 95% CI: 0.355&#x2013;0.757). Results are summarized in <xref ref-type="table" rid="tab5">Table 5</xref>.</p>
<table-wrap position="float" id="tab5">
<label>Table 5</label>
<caption>
<p>Results of multivariate logistic regression describing the relationship between personal and work-related factors with WMSD.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top" colspan="2" rowspan="2">Factors</th>
<th align="center" valign="top" rowspan="2">ORs</th>
<th align="center" valign="top" colspan="2">95%CI</th>
<th align="center" valign="top" rowspan="2">
<italic>P</italic>
</th>
</tr>
<tr>
<th align="center" valign="top">Lower</th>
<th align="center" valign="top">Upper</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle" rowspan="2">Smoking behavior</td>
<td align="left" valign="middle">No</td>
<td/>
<td/>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Regular</td>
<td align="char" valign="middle" char=".">1.583</td>
<td align="char" valign="middle" char=".">1.039</td>
<td align="char" valign="middle" char=".">2.412</td>
<td align="char" valign="middle" char=".">0.033</td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="3">Perceived health status</td>
<td align="left" valign="middle">Perfect</td>
<td/>
<td/>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Fine</td>
<td align="char" valign="middle" char=".">2.895</td>
<td align="char" valign="middle" char=".">2.048</td>
<td align="char" valign="middle" char=".">4.093</td>
<td align="char" valign="middle" char=".">&#x003C;0.001</td>
</tr>
<tr>
<td align="left" valign="middle">Poor</td>
<td align="char" valign="middle" char=".">4.034</td>
<td align="char" valign="middle" char=".">1.68</td>
<td align="char" valign="middle" char=".">9.688</td>
<td align="char" valign="middle" char=".">0.002</td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="2">Work in uncomfortable postures</td>
<td align="left" valign="middle">Never</td>
<td/>
<td/>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Occasionally</td>
<td align="char" valign="middle" char=".">1.912</td>
<td align="char" valign="middle" char=".">1.184</td>
<td align="char" valign="middle" char=".">3.088</td>
<td align="char" valign="middle" char=".">0.008</td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="2">Repeat operation many times a working minute</td>
<td align="left" valign="middle">No</td>
<td/>
<td/>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Yes</td>
<td align="char" valign="middle" char=".">1.672</td>
<td align="char" valign="middle" char=".">1.161</td>
<td align="char" valign="middle" char=".">2.41</td>
<td align="char" valign="middle" char=".">0.006</td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="2">Enough rest time</td>
<td align="left" valign="middle">No</td>
<td/>
<td/>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Yes</td>
<td align="char" valign="middle" char=".">0.518</td>
<td align="char" valign="middle" char=".">0.355</td>
<td align="char" valign="middle" char=".">0.757</td>
<td align="char" valign="middle" char=".">0.001</td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="2">Keep bowing the head for long hours</td>
<td align="left" valign="middle">No</td>
<td/>
<td/>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Yes</td>
<td align="char" valign="middle" char=".">1.639</td>
<td align="char" valign="middle" char=".">1.039</td>
<td align="char" valign="middle" char=".">2.584</td>
<td align="char" valign="middle" char=".">0.034</td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="2">Keep bending knees for long hours</td>
<td align="left" valign="middle">No</td>
<td/>
<td/>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle">Yes</td>
<td align="char" valign="middle" char=".">1.531</td>
<td align="char" valign="middle" char=".">1.002</td>
<td align="char" valign="middle" char=".">2.339</td>
<td align="char" valign="middle" char=".">0.049</td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="2">Length of employment (years)</td>
<td align="left" valign="middle">&#x003C;10</td>
<td/>
<td/>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="middle">&#x003E;20</td>
<td align="char" valign="middle" char=".">2.364</td>
<td align="char" valign="middle" char=".">1.3</td>
<td align="char" valign="middle" char=".">4.3</td>
<td align="char" valign="middle" char=".">0.005</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>Although sex and age did not reach statistical significance in the univariate analyses, both variables may act as potential confounders influencing the associations between multiple predictors and WMSD prevalence. To assess the potential confounding effects of age and sex, we conducted a sensitivity analysis by adding these two variables to the multivariable logistic regression model. The inclusion of age and sex did not materially alter the direction or magnitude of the main associations. The full results of this analysis are presented in <xref ref-type="supplementary-material" rid="SM1">Supplementary Table S3</xref>.</p>
</sec>
</sec>
<sec id="sec34">
<label>3.4</label>
<title>Construction of a risk prediction model for WMSD</title>
<sec id="sec35">
<label>3.4.1</label>
<title>Construction and validation of a single model</title>
<p>The eight identified determinants included in the six machine learning models are: length of employment (years), smoking behavior, perceived health status, working in uncomfortable postures, repetitive operation, rest time, duration of a head bow, and knee bend. The comparison of the individual model&#x2019;s accuracy, precision, recall, F1 score and AUC are presented in <xref ref-type="table" rid="tab6">Tables 6</xref>&#x2013;<xref ref-type="table" rid="tab10">10</xref> and <xref ref-type="fig" rid="fig1">Figure 1</xref>. In summary, the NN model has the highest AUC (0.886 training, 0.704 test), strong precision and F1 score. The NB model has stable performance across metrics. The RF model has high accuracy but lower recall in the test set. The SVM model reported high precision but inconsistent recall. The DT and K-NN models had moderate performance.</p>
<table-wrap position="float" id="tab6">
<label>Table 6</label>
<caption>
<p>Comparison of the accuracy of the training and test sets of the six models.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top" rowspan="2">Algorithm</th>
<th align="center" valign="top" colspan="2">Training set</th>
<th align="center" valign="top" colspan="2">Test set</th>
</tr>
<tr>
<th align="center" valign="top">Mean</th>
<th align="center" valign="top">95%CI</th>
<th align="center" valign="top">Mean</th>
<th align="center" valign="top">95%CI</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle">Random forest</td>
<td align="char" valign="middle" char=".">0.909</td>
<td align="center" valign="middle">(0.889, 0.926)</td>
<td align="char" valign="middle" char=".">0.809</td>
<td align="center" valign="middle">(0.755, 0.834)</td>
</tr>
<tr>
<td align="left" valign="middle">Decision tree</td>
<td align="char" valign="middle" char=".">0.838</td>
<td align="center" valign="middle">(0.813, 0.860)</td>
<td align="char" valign="middle" char=".">0.846</td>
<td align="center" valign="middle">(0.808, 0.879)</td>
</tr>
<tr>
<td align="left" valign="middle">Na&#x00EF;ve Bayes</td>
<td align="char" valign="middle" char=".">0.779</td>
<td align="center" valign="middle">(0.752, 0.805)</td>
<td align="char" valign="middle" char=".">0.768</td>
<td align="center" valign="middle">(0.725, 0.808)</td>
</tr>
<tr>
<td align="left" valign="middle">Neural network</td>
<td align="char" valign="middle" char=".">0.865</td>
<td align="center" valign="middle">(0.842, 0.886)</td>
<td align="char" valign="middle" char=".">0.839</td>
<td align="center" valign="middle">(0.801, 0.873)</td>
</tr>
<tr>
<td align="left" valign="middle">Support vector machines</td>
<td align="char" valign="middle" char=".">0.909</td>
<td align="center" valign="middle">(0.889, 0.926)</td>
<td align="char" valign="middle" char=".">0.801</td>
<td align="center" valign="middle">(0.260, 0.838)</td>
</tr>
<tr>
<td align="left" valign="middle">K-nearest neighbors</td>
<td align="char" valign="middle" char=".">0.837</td>
<td align="center" valign="middle">(0.812, 0.859)</td>
<td align="char" valign="middle" char=".">0.837</td>
<td align="center" valign="middle">(0.783, 0.858)</td>
</tr>
</tbody>
</table>
</table-wrap>
<table-wrap position="float" id="tab7">
<label>Table 7</label>
<caption>
<p>Comparison of the precision of the training and test sets of the six models.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Algorithm</th>
<th align="center" valign="top">Training set</th>
<th align="center" valign="top">Test set</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle">Random forest</td>
<td align="char" valign="middle" char=".">0.966</td>
<td align="char" valign="middle" char=".">0.918</td>
</tr>
<tr>
<td align="left" valign="middle">Decision tree</td>
<td align="char" valign="middle" char=".">0.963</td>
<td align="char" valign="middle" char=".">0.960</td>
</tr>
<tr>
<td align="left" valign="middle">Na&#x00EF;ve Bayes</td>
<td align="char" valign="middle" char=".">0.811</td>
<td align="char" valign="middle" char=".">0.816</td>
</tr>
<tr>
<td align="left" valign="middle">Neural network</td>
<td align="char" valign="middle" char=".">0.966</td>
<td align="char" valign="middle" char=".">0.949</td>
</tr>
<tr>
<td align="left" valign="middle">Support vector machines</td>
<td align="char" valign="middle" char=".">0.983</td>
<td align="char" valign="middle" char=".">0.938</td>
</tr>
<tr>
<td align="left" valign="middle">K-nearest neighbors</td>
<td align="char" valign="middle" char=".">0.953</td>
<td align="char" valign="middle" char=".">0.949</td>
</tr>
</tbody>
</table>
</table-wrap>
<table-wrap position="float" id="tab8">
<label>Table 8</label>
<caption>
<p>Comparison of the recall value of the training and test sets of the six models.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Algorithm</th>
<th align="center" valign="top">Training set</th>
<th align="center" valign="top">Test set</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle">Random forest</td>
<td align="char" valign="middle" char=".">0.658</td>
<td align="char" valign="middle" char=".">0.246</td>
</tr>
<tr>
<td align="left" valign="middle">Decision tree</td>
<td align="char" valign="middle" char=".">0.293</td>
<td align="char" valign="middle" char=".">0.261</td>
</tr>
<tr>
<td align="left" valign="middle">Na&#x00EF;ve Bayes</td>
<td align="char" valign="middle" char=".">0.641</td>
<td align="char" valign="middle" char=".">0.522</td>
</tr>
<tr>
<td align="left" valign="middle">Neural network</td>
<td align="char" valign="middle" char=".">0.424</td>
<td align="char" valign="middle" char=".">0.275</td>
</tr>
<tr>
<td align="left" valign="middle">Support vector machines</td>
<td align="char" valign="middle" char=".">0.587</td>
<td align="char" valign="middle" char=".">0.101</td>
</tr>
<tr>
<td align="left" valign="middle">K-nearest neighbors</td>
<td align="char" valign="middle" char=".">0.332</td>
<td align="char" valign="middle" char=".">0.261</td>
</tr>
</tbody>
</table>
</table-wrap>
<table-wrap position="float" id="tab9">
<label>Table 9</label>
<caption>
<p>Comparison of the F1-score of the training and test sets of the six models.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Algorithm</th>
<th align="center" valign="top">Training set</th>
<th align="center" valign="top">Test set</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle">Random forest</td>
<td align="char" valign="middle" char=".">0.783</td>
<td align="char" valign="middle" char=".">0.389</td>
</tr>
<tr>
<td align="left" valign="middle">Decision tree</td>
<td align="char" valign="middle" char=".">0.450</td>
<td align="char" valign="middle" char=".">0.410</td>
</tr>
<tr>
<td align="left" valign="middle">Na&#x00EF;ve Bayes</td>
<td align="char" valign="middle" char=".">0.716</td>
<td align="char" valign="middle" char=".">0.637</td>
</tr>
<tr>
<td align="left" valign="middle">Neural network</td>
<td align="char" valign="middle" char=".">0.589</td>
<td align="char" valign="middle" char=".">0.427</td>
</tr>
<tr>
<td align="left" valign="middle">Support vector machines</td>
<td align="char" valign="middle" char=".">0.735</td>
<td align="char" valign="middle" char=".">0.183</td>
</tr>
<tr>
<td align="left" valign="middle">K-nearest neighbors</td>
<td align="char" valign="middle" char=".">0.492</td>
<td align="char" valign="middle" char=".">0.409</td>
</tr>
</tbody>
</table>
</table-wrap>
<table-wrap position="float" id="tab10">
<label>Table 10</label>
<caption>
<p>Comparison of the AUC of the training and test sets of the six models.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Algorithm</th>
<th align="center" valign="top">Training set</th>
<th align="center" valign="top">Test set</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle">Random forest</td>
<td align="char" valign="middle" char=".">0.812</td>
<td align="char" valign="middle" char=".">0.581</td>
</tr>
<tr>
<td align="left" valign="middle">Decision tree</td>
<td align="char" valign="middle" char=".">0.628</td>
<td align="char" valign="middle" char=".">0.611</td>
</tr>
<tr>
<td align="left" valign="middle">Na&#x00EF;ve Bayes</td>
<td align="char" valign="middle" char=".">0.726</td>
<td align="char" valign="middle" char=".">0.669</td>
</tr>
<tr>
<td align="left" valign="middle">Neural network</td>
<td align="char" valign="middle" char=".">0.886</td>
<td align="char" valign="middle" char=".">0.704</td>
</tr>
<tr>
<td align="left" valign="middle">Support vector machines</td>
<td align="char" valign="middle" char=".">0.785</td>
<td align="char" valign="middle" char=".">0.520</td>
</tr>
<tr>
<td align="left" valign="middle">K-nearest neighbors</td>
<td align="char" valign="middle" char=".">0.642</td>
<td align="char" valign="middle" char=".">0.576</td>
</tr>
</tbody>
</table>
</table-wrap>
<fig position="float" id="fig1">
<label>Figure 1</label>
<caption>
<p>ROC curves for six base models: <bold>(A)</bold> ROC curve for training set and <bold>(B)</bold> ROC curve for test set.</p>
</caption>
<graphic xlink:href="fpubh-14-1729879-g001.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">Multiple model ROC curves are shown to compare classification performances. Image A shows ROC curves with AUC values: NN 0.886, DT 0.628, RF 0.812, K-NN 0.642, NB 0.726, SVM 0.785. Image B shows ROC curves with AUC values: NN 0.704, DT 0.611, RF 0.581, K-NN 0.576, NB 0.669, SVM 0.520. Sensitivity is plotted against specificity, with a diagonal reference line for comparison.</alt-text>
</graphic>
</fig>
</sec>
<sec id="sec36">
<label>3.4.2</label>
<title>Ensemble model</title>
<p>To enhance the overall predictive accuracy of the individual models, a stacking ensemble model was constructed using the six individual models and a generalized linear model as the meta-learner. The ensemble model achieved the highest AUC (0.759), outperforming all individual models. Results are shown in <xref ref-type="table" rid="tab11">Table 11</xref>.</p>
<table-wrap position="float" id="tab11">
<label>Table 11</label>
<caption>
<p>Comparison of AUC values for each model after integration.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Algorithm</th>
<th align="center" valign="top">AUC</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle">Ensemble</td>
<td align="char" valign="middle" char=".">0.759</td>
</tr>
<tr>
<td align="left" valign="middle">Neural network</td>
<td align="char" valign="middle" char=".">0.746</td>
</tr>
<tr>
<td align="left" valign="middle">Decision tree</td>
<td align="char" valign="middle" char=".">0.65</td>
</tr>
<tr>
<td align="left" valign="middle">Random forest</td>
<td align="char" valign="middle" char=".">0.727</td>
</tr>
<tr>
<td align="left" valign="middle">K-nearest neighbors</td>
<td align="char" valign="middle" char=".">0.725</td>
</tr>
<tr>
<td align="left" valign="middle">Support vector machine</td>
<td align="char" valign="middle" char=".">0.708</td>
</tr>
<tr>
<td align="left" valign="middle">Na&#x00EF;ve Bayes</td>
<td align="char" valign="middle" char=".">0.731</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
</sec>
</sec>
<sec sec-type="discussion" id="sec37">
<label>4</label>
<title>Discussion</title>
<p>Musculoskeletal disorders affect about one-fifth of the world&#x2019;s population and are a leading cause of disability and reduced quality of life worldwide (<xref ref-type="bibr" rid="ref5">5</xref>). WMSD is an emerging focus of public health and occupational health research due to its substantial impact on worker well-being and organizational productivity. These conditions are particularly prevalent in physically demanding industries, where repetitive motion, sustained awkward postures, and biomechanical strain are common. Beyond the individual burden, WMSD contributes to increased absenteeism, reduced work efficiency, and escalating healthcare and social insurance costs. As a result, identifying and predicting determinants of WMSD would aid in targeted interventions to mitigate risk and improve workforce sustainability.</p>
<p>In this study, the 12-month prevalence of WMSD among Chinese coal miners was 82%, with the neck, shoulders, and lower back being the most frequently affected sites. This prevalence was higher than that reported among workers in some manufacturing and service sectors (<xref ref-type="bibr" rid="ref17">17</xref>, <xref ref-type="bibr" rid="ref18">18</xref>), but comparable to estimates from studies conducted in similar mining occupations (<xref ref-type="bibr" rid="ref19">19</xref>). Previous epidemiological studies have consistently shown a higher prevalence of WMSDs among mining workers compared with the general industrial workforce (<xref ref-type="bibr" rid="ref20">20</xref>). This pattern is likely related to sustained heavy physical workload, repetitive work tasks, and constrained working postures. Overall, differences in WMSD prevalence across regions appear to largely reflect variations in occupational workload and working conditions. The high prevalence of multisite WMSD (86.3%) further emphasizes the cumulative nature of these disorders in physically intensive occupations such as coal mining.</p>
<p>The etiopathology of WMSD involves a complex interplay of behavioral, occupational and environmental factors. Our findings indicate that the length of employment is a significant predictor of WMSD, consistent with prior research that associates prolonged occupational exposure with musculoskeletal injuries (<xref ref-type="bibr" rid="ref7">7</xref>, <xref ref-type="bibr" rid="ref21">21</xref>, <xref ref-type="bibr" rid="ref22">22</xref>). This may be due to the compounding effect of aging with sustained physical exertion, which contributes to progressive tissue damage, inadvertently increasing the risk of injury and leading to WMSD. Our observations reinforce the understanding of WMSD as cumulative traumas disorders, often resulting from repetitive strain and biomechanical overload.</p>
<p>Regarding individual behavioral factors, our study found physical activity to be a protective factor against WMSD. Workers who engaged in regular exercise had a lower prevalence of WMSD, consistent with existing literature that highlights the role physical activity has in enhancing musculoskeletal resilience and reducing occupational injury (<xref ref-type="bibr" rid="ref23">23</xref>). Conversely, smoking was associated with an increased risk of WMSD. This may be attributed to smoking-induced vascular impairment, systemic inflammation, reduced bone mineral density, and heightened pain sensitivity (<xref ref-type="bibr" rid="ref24 ref25 ref26">24&#x2013;26</xref>). Additionally, smoking-related habits and stress may contribute to poor posture and increased muscle tension, which can further exacerbate the musculoskeletal strain.</p>
<p>Regarding occupational exposure factors, biomedical stressors, particularly the need to maintain static postures for extended periods of time, were also found to significantly increase the risk of WMSD. This finding concurs with prior research identifying prolonged static loading and repetitive movements in coal mining operations as principal risk factors for WMSD (<xref ref-type="bibr" rid="ref27">27</xref>, <xref ref-type="bibr" rid="ref28">28</xref>). Muscle fatigue resulting from sustained postural demands can lead to chronic tension and microtrauma. Environmental exposures, such as working in cold or fluctuating temperatures, were similarly linked to increased WMSD prevalence. Miners operating in low-temperature conditions reported higher rates of musculoskeletal complaints, a trend supported by research indicating that cold environments amplify physical strain and reduce tissue elasticity, thereby increasing injury susceptibility (<xref ref-type="bibr" rid="ref29">29</xref>). These findings highlight the importance of improving occupational and ergonomic assessments to prevent WMSD, particularly among smokers and those with long tenures.</p>
<p>Perceived health status is regarded as a comprehensive indicator reflecting an individual&#x2019;s overall physiological, psychological, and functional state (<xref ref-type="bibr" rid="ref30">30</xref>). This study found that perceived health status is one of the key indicators for predicting the risk of work-related musculoskeletal injuries: workers who self-reported poorer health had a significantly higher prevalence of musculoskeletal injuries compared to those who self-reported better health. This conclusion aligns with previous research findings among occupational populations. Previous studies indicate that among occupational groups such as healthcare workers and cleaners, individuals with poorer perceived health exhibit a significantly elevated risk of musculoskeletal symptoms, even after controlling for demographic characteristics and work-related factors (<xref ref-type="bibr" rid="ref1">1</xref>, <xref ref-type="bibr" rid="ref30">30</xref>). From a mechanistic perspective, poorer perceived health may reflect diminished physical function, reduced musculoskeletal tolerance, or increased burden of underlying chronic conditions. These factors compromise an individual&#x2019;s capacity to adapt to occupational exposures, such as prolonged physical labor, repetitive tasks, and poor work postures. Consequently, the decline in physiological reserves under sustained occupational stress may facilitate the onset of musculoskeletal injuries or exacerbate the persistence and worsening of existing WMSD symptoms.</p>
<p>From the perspective of occupational health practice and policy formulation, our findings hold significant implications. Among the multiple predictors identified in this study, certain factors&#x2014;such as rest period scheduling, work posture, repetitive motions, and workplace environmental conditions&#x2014;are highly amenable to intervention. This suggests that optimizing ergonomic design, rationally configuring work-rest systems, and improving workplace environments can effectively reduce the risk of WMSD occurrence at the practical level. Concurrently, the findings support integrating health promotion measures&#x2014;such as encouraging physical activity and implementing tobacco control interventions&#x2014;into occupational health management systems, with particular emphasis on targeted prevention for long-tenured employees and those in high-exposure positions. At the policy level, this study provides empirical evidence for developing and refining occupational hygiene standards, ergonomic guidelines, and labor protection policies, thereby advancing the implementation of prevention-oriented, comprehensive WMSD control strategies.</p>
<p>Results of our predictive modeling demonstrate that among the individual models built, NN and NB yields the most accurate predictions. The stacking ensemble model further improved overall performance, achieving an AUC of 0.759, which represents a 7.8% increase compared with the NN model. This substantial improvement can be attributed to the ability of the stacking approach to effectively integrate the prediction outputs of multiple base learners, thereby leveraging the complementary strengths of different modeling strategies in feature representation and decision-making. The stacking ensemble reduces the risk of overfitting associated with single models while substantially enhancing generalization performance. This conclusion concurs with recent studies in infectious disease, heart disease, breast cancer and lung adenocarcinoma, and peritoneal dialysis treatment predictions where stacking models demonstrated better performance (<xref ref-type="bibr" rid="ref31 ref32 ref33 ref34 ref35">31&#x2013;35</xref>).</p>
<p>Despite the notable performance advantages of stacking ensemble models, several practical considerations should be acknowledged when translating these approaches into real-world applications. Compared with single models, ensemble learning methods are generally associated with higher computational costs due to the need to train multiple base learners and a meta-learner. Moreover, their development and deployment require specific technological infrastructure and reliance on advanced technical skills related to machine learning model construction, parameter tuning, and performance evaluation. These factors may limit the widespread adoption of stacking models in routine occupational health practice. Future research should therefore focus on reducing computational complexity, optimizing ensemble strategies, and developing user-friendly tools to facilitate broader implementation across diverse application settings.</p>
<p>In addition to identifying key predictors, the machine learning models developed in this study have potential applicability in occupational health practice. Based on routinely available demographic, work-related, and health-related information, these models can be used to estimate individual-level risk of work-related musculoskeletal disorders (WMSDs), thereby facilitating early identification and risk stratification of high-risk workers. Recent study has demonstrated the feasibility of applying machine learning approaches for WMSD risk prediction and prevention-oriented occupational health management, supporting their use as decision-support tools rather than diagnostic instruments (<xref ref-type="bibr" rid="ref36">36</xref>). Such models could be integrated into routine occupational health examinations or workplace health surveillance systems to support targeted preventive interventions, while further prospective validation is warranted to assess their generalizability and real-world performance.</p>
<p>To the best of our knowledge, our research is the first to use multiple machine learning algorithms to predict the risk of occurrence of WMSD in coal miners. Based on the six individual models constructed, an advanced stacking ensemble learning approach was further applied to effectively integrate the machine learning models, thereby enhancing overall predictive performance.</p>
<p>The study has a few limitations. Our study was conducted across two mining companies in one region of China. We have limited our study to this setting for pragmatic reasons in being able to access the participants and number needed. Furthermore, this epidemiologic study relied predominately on self-reported questionnaires, recall bias and other biases associated with questionnaire-based research cannot be avoided despite strict quality control during the survey process. The primary objective of this study was to identify key predictive factors based on a relatively large dataset, with the research focus placed on individual-level occupational exposure characteristics and health outcomes. Accordingly, the study site was not incorporated at the analytical level, which to some extent limited the assessment of potential heterogeneity between the two study locations. Future studies incorporating site-level information may further explore stratified or multilevel analytical approaches.</p>
</sec>
<sec sec-type="conclusions" id="sec38">
<label>5</label>
<title>Conclusion</title>
<p>Our study confirmed that neck, shoulders, and lower back discomfort are highly prevalent among coal miners, underscoring the occupational burden of WMSD in this population. Numerous individual and work-related factors were significantly associated with the development of WMSD. These factors appeared to develop cumulatively over time. Importantly, our research demonstrated that machine learning algorithms can be used to predict WMSD risk with high accuracy. By integrating six base models using the stacking ensemble method, we achieved better predictive performance than any single model. This highlights the potential of ensemble learning to enhance the precision and reliability of risk prediction in complex, high-dimensional datasets.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="sec39">
<title>Data availability statement</title>
<p>The raw data supporting the conclusions of this article will be made available by the authors, without undue reservation.</p>
</sec>
<sec sec-type="author-contributions" id="sec40">
<title>Author contributions</title>
<p>JL: Conceptualization, Data curation, Formal analysis, Investigation, Methodology, Supervision, Validation, Writing &#x2013; original draft, Writing &#x2013; review &#x0026; editing. XZ: Data curation, Supervision, Writing &#x2013; original draft, Writing &#x2013; review &#x0026; editing. YLi: Data curation, Validation, Visualization, Writing &#x2013; review &#x0026; editing. WDi: Writing &#x2013; review &#x0026; editing. WDu: Writing &#x2013; review &#x0026; editing. DL: Writing &#x2013; review &#x0026; editing, Methodology, Validation. YLia: Writing &#x2013; review &#x0026; editing, Investigation, Supervision. ZF: Funding acquisition, Investigation, Resources, Supervision, Writing &#x2013; review &#x0026; editing.</p>
</sec>
<ack>
<title>Acknowledgments</title>
<p>We sincerely thank all the personnel of Jining Center for Disease Control and Prevention who participated in this study. We gratefully acknowledge the use of Microsoft Word Editor and Grammar (version 1.2.167.1681) to enhance the clarity and fluency of the final manuscript. Data from the large language model was used to inform the drafting process; however, generative artificial intelligence was not employed in collecting or analyzing research data.</p>
</ack>
<sec sec-type="COI-statement" id="sec41">
<title>Conflict of interest</title>
<p>The author(s) declared that this work was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
<p>The reviewer AH declared a past collaboration with the author DL to the handling editor.</p>
</sec>
<sec sec-type="ai-statement" id="sec42">
<title>Generative AI statement</title>
<p>The author(s) declared that Generative AI was not used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p>
</sec>
<sec sec-type="disclaimer" id="sec43">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec sec-type="supplementary-material" id="sec44">
<title>Supplementary material</title>
<p>The Supplementary material for this article can be found online at: <ext-link xlink:href="https://www.frontiersin.org/articles/10.3389/fpubh.2026.1729879/full#supplementary-material" ext-link-type="uri">https://www.frontiersin.org/articles/10.3389/fpubh.2026.1729879/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Table_1.docx" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="ref1"><label>1.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>J</given-names></name> <name><surname>Cui</surname> <given-names>Y</given-names></name> <name><surname>He</surname> <given-names>L</given-names></name> <name><surname>Xu</surname> <given-names>X</given-names></name> <name><surname>Yuan</surname> <given-names>Z</given-names></name> <name><surname>Jin</surname> <given-names>X</given-names></name> <etal/></person-group>. <article-title>Work-related musculoskeletal disorders and risk factors among Chinese medical staff of obstetrics and gynecology</article-title>. <source>Int J Environ Res Public Health</source>. (<year>2017</year>) <volume>14</volume>:<fpage>562</fpage>&#x2013;<lpage>70</lpage>. doi: <pub-id pub-id-type="doi">10.3390/ijerph14060562</pub-id>, <pub-id pub-id-type="pmid">28587123</pub-id></mixed-citation></ref>
<ref id="ref2"><label>2.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Nazerian</surname> <given-names>R</given-names></name> <name><surname>Korhan</surname> <given-names>O</given-names></name> <name><surname>Shakeri</surname> <given-names>E</given-names></name></person-group>. <article-title>Work-related musculoskeletal discomfort among heavy truck drivers</article-title>. <source>Int J Occup Saf Ergon</source>. (<year>2020</year>) <volume>26</volume>:<fpage>233</fpage>&#x2013;<lpage>44</lpage>. doi: <pub-id pub-id-type="doi">10.1080/10803548.2018.1433107</pub-id>, <pub-id pub-id-type="pmid">29433379</pub-id></mixed-citation></ref>
<ref id="ref3"><label>3.</label><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Sun</surname> <given-names>GF</given-names></name> <name><surname>Wu</surname> <given-names>TC</given-names></name> <name><surname>Niu</surname> <given-names>Q</given-names></name></person-group>. <source>Occupational health and occupational medicine</source>. <publisher-loc>Beijing, China</publisher-loc>: <publisher-name>People's Medical Publishing House</publisher-name> (<year>2012</year>).</mixed-citation></ref>
<ref id="ref4"><label>4.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Fatoye</surname> <given-names>F</given-names></name> <name><surname>Gebrye</surname> <given-names>T</given-names></name> <name><surname>Mbada</surname> <given-names>C</given-names></name> <name><surname>Useh</surname> <given-names>U</given-names></name></person-group>. <article-title>Economic evaluations of digital health interventions for the Management of Musculoskeletal Disorders: systematic review and Meta-analysis</article-title>. <source>J Med Internet Res</source>. (<year>2023</year>) <volume>25</volume>:<fpage>e41113</fpage>. doi: <pub-id pub-id-type="doi">10.2196/41113</pub-id>, <pub-id pub-id-type="pmid">37410542</pub-id></mixed-citation></ref>
<ref id="ref5"><label>5.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Cieza</surname> <given-names>A</given-names></name> <name><surname>Causey</surname> <given-names>K</given-names></name> <name><surname>Kamenov</surname> <given-names>K</given-names></name> <name><surname>Hanson</surname> <given-names>SW</given-names></name> <name><surname>Chatterji</surname> <given-names>S</given-names></name> <name><surname>Vos</surname> <given-names>T</given-names></name></person-group>. <article-title>Global estimates of the need for rehabilitation based on the global burden of disease study 2019: a systematic analysis for the global burden of disease study 2019</article-title>. <source>Lancet</source>. (<year>2021</year>) <volume>396</volume>:<fpage>2006</fpage>&#x2013;<lpage>17</lpage>. doi: <pub-id pub-id-type="doi">10.1016/s0140-6736(20)32340-0</pub-id>, <pub-id pub-id-type="pmid">33275908</pub-id></mixed-citation></ref>
<ref id="ref6"><label>6.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Punnett</surname> <given-names>L</given-names></name> <name><surname>Wegman</surname> <given-names>DH</given-names></name></person-group>. <article-title>Work-related musculoskeletal disorders: the epidemiologic evidence and the debate</article-title>. <source>J Electromyogr Kinesiol</source>. (<year>2004</year>) <volume>14</volume>:<fpage>13</fpage>&#x2013;<lpage>23</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.jelekin.2003.09.015</pub-id>, <pub-id pub-id-type="pmid">14759746</pub-id></mixed-citation></ref>
<ref id="ref7"><label>7.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>He</surname> <given-names>X</given-names></name> <name><surname>Xiao</surname> <given-names>B</given-names></name> <name><surname>Wu</surname> <given-names>J</given-names></name> <name><surname>Chen</surname> <given-names>C</given-names></name> <name><surname>Li</surname> <given-names>W</given-names></name> <name><surname>Yan</surname> <given-names>M</given-names></name></person-group>. <article-title>Prevalence of work-related musculoskeletal disorders among Workers in the Automobile Manufacturing Industry in China: a systematic review and meta-analysis</article-title>. <source>BMC Public Health</source>. (<year>2023</year>) <volume>23</volume>:<fpage>2042</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s12889-023-16896-x</pub-id>, <pub-id pub-id-type="pmid">37858206</pub-id></mixed-citation></ref>
<ref id="ref8"><label>8.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>YT</given-names></name> <name><surname>Li</surname> <given-names>XX</given-names></name> <name><surname>Hu</surname> <given-names>WJ</given-names></name> <name><surname>Wang</surname> <given-names>D</given-names></name> <name><surname>Zhang</surname> <given-names>SY</given-names></name> <name><surname>Liu</surname> <given-names>AQ</given-names></name> <etal/></person-group>. <article-title>Geographic distribution of coal enterprises and workers exposed to coal dust in China in 2020</article-title>. <source>Biomed Environ Sci</source>. (<year>2023</year>) <volume>36</volume>:<fpage>476</fpage>&#x2013;<lpage>80</lpage>. doi: <pub-id pub-id-type="doi">10.3967/bes2023.058</pub-id>, <pub-id pub-id-type="pmid">37253675</pub-id></mixed-citation></ref>
<ref id="ref9"><label>9.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Lu</surname> <given-names>Y</given-names></name> <name><surname>Zhang</surname> <given-names>Z</given-names></name> <name><surname>Gao</surname> <given-names>S</given-names></name> <name><surname>Yan</surname> <given-names>H</given-names></name> <name><surname>Zhang</surname> <given-names>L</given-names></name> <name><surname>Liu</surname> <given-names>J</given-names></name></person-group>. <article-title>The status of occupational burnout and its influence on the psychological health of factory workers and miners in Wulumuqi, China</article-title>. <source>Biomed Res Int</source>. (<year>2020</year>) <volume>2020</volume>:<fpage>6890186</fpage>. doi: <pub-id pub-id-type="doi">10.1155/2020/6890186</pub-id>, <pub-id pub-id-type="pmid">32190676</pub-id></mixed-citation></ref>
<ref id="ref10"><label>10.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Huang</surname> <given-names>L</given-names></name> <name><surname>Guo</surname> <given-names>S</given-names></name> <name><surname>Long</surname> <given-names>L</given-names></name></person-group>. <article-title>Correlation analysis of occupational musculoskeletal disorders and occupational stress in coal miners</article-title>. <source>Indust Health Occupat Dis</source>. (<year>2019</year>) <volume>45</volume>:<fpage>460</fpage>&#x2013;<lpage>2+5</lpage>. doi: <pub-id pub-id-type="doi">10.13692/j.cnki.gywsyzyb.2019.06.012</pub-id></mixed-citation></ref>
<ref id="ref11"><label>11.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Burstr&#x00F6;m</surname> <given-names>L</given-names></name> <name><surname>Aminoff</surname> <given-names>A</given-names></name> <name><surname>Bj&#x00F6;r</surname> <given-names>B</given-names></name> <name><surname>M&#x00E4;ntt&#x00E4;ri</surname> <given-names>S</given-names></name> <name><surname>Nilsson</surname> <given-names>T</given-names></name> <name><surname>Pettersson</surname> <given-names>H</given-names></name> <etal/></person-group>. <article-title>Musculoskeletal symptoms and exposure to whole-body vibration among open-pit mine Workers in the Arctic</article-title>. <source>Int J Occup Med Environ Health</source>. (<year>2017</year>) <volume>30</volume>:<fpage>553</fpage>&#x2013;<lpage>64</lpage>. doi: <pub-id pub-id-type="doi">10.13075/ijomeh.1896.00975</pub-id>, <pub-id pub-id-type="pmid">28584322</pub-id></mixed-citation></ref>
<ref id="ref12"><label>12.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>X</given-names></name> <name><surname>Bie</surname> <given-names>F</given-names></name> <name><surname>Li</surname> <given-names>X</given-names></name> <name><surname>Wang</surname> <given-names>Z</given-names></name></person-group>. <article-title>Investigation and research on musculoskeletal disorders and related factors in coal mine workers</article-title>. <source>Chin J Indust Med</source>. (<year>2020</year>) <volume>33</volume>:<fpage>211</fpage>&#x2013;<lpage>6</lpage>. doi: <pub-id pub-id-type="doi">10.13631/j.cnki.zggyyx.2020.03.004</pub-id></mixed-citation></ref>
<ref id="ref13"><label>13.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Yi</surname> <given-names>X</given-names></name> <name><surname>Yang</surname> <given-names>J</given-names></name> <name><surname>Gao</surname> <given-names>X</given-names></name> <name><surname>Li</surname> <given-names>F</given-names></name></person-group>. <article-title>The relationship between occupational stress, mental health and work ability of coal chemical Workers in Xinjiang</article-title>. <source>Front Psych</source>. (<year>2022</year>) <volume>13</volume>:<fpage>903534</fpage>. doi: <pub-id pub-id-type="doi">10.3389/fpsyt.2022.903534</pub-id>, <pub-id pub-id-type="pmid">36061289</pub-id></mixed-citation></ref>
<ref id="ref14"><label>14.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>von Elm</surname> <given-names>E</given-names></name> <name><surname>Altman</surname> <given-names>DG</given-names></name> <name><surname>Egger</surname> <given-names>M</given-names></name> <name><surname>Pocock</surname> <given-names>SJ</given-names></name> <name><surname>G&#x00F8;tzsche</surname> <given-names>PC</given-names></name> <name><surname>Vandenbroucke</surname> <given-names>JP</given-names></name></person-group>. <article-title>The strengthening the reporting of observational studies in epidemiology (Strobe) statement: guidelines for reporting observational studies</article-title>. <source>Lancet</source>. (<year>2007</year>) <volume>370</volume>:<fpage>1453</fpage>&#x2013;<lpage>7</lpage>. doi: <pub-id pub-id-type="doi">10.1016/s0140-6736(07)61602-x</pub-id></mixed-citation></ref>
<ref id="ref15"><label>15.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Yang</surname> <given-names>L</given-names></name> <name><surname>Hildebrandt</surname> <given-names>V</given-names></name> <name><surname>Yu</surname> <given-names>S</given-names></name> <name><surname>Ling</surname> <given-names>R</given-names></name> <name><surname>He</surname> <given-names>L</given-names></name> <name><surname>Chen</surname> <given-names>W</given-names></name> <etal/></person-group>. <article-title>Introduction of a musculoskeletal disorders questionnaire with the questionnaire attached</article-title>. <source>Indust Health Occupat Dis</source>. (<year>2009</year>) <volume>35</volume>:<fpage>25</fpage>&#x2013;<lpage>31</lpage>. doi: <pub-id pub-id-type="doi">10.13692/j.cnki.gywsyzyb.2009.01.001</pub-id></mixed-citation></ref>
<ref id="ref16"><label>16.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname> <given-names>D</given-names></name> <name><surname>Lu</surname> <given-names>L</given-names></name> <name><surname>Hu</surname> <given-names>H</given-names></name> <name><surname>He</surname> <given-names>Z</given-names></name> <name><surname>Lin</surname> <given-names>X</given-names></name> <name><surname>Jia</surname> <given-names>N</given-names></name> <etal/></person-group>. <article-title>Analysis of risk factors of multi-site work-related musculoskeletal disorders among workers in the industry of electronic equipment manufacturing</article-title>. <source>China Occupat Med</source>. (<year>2020</year>) <volume>47</volume>:<fpage>253</fpage>&#x2013;<lpage>9</lpage>. doi: <pub-id pub-id-type="doi">10.11763/j.issn.2095-2619.2020.03.003</pub-id></mixed-citation></ref>
<ref id="ref17"><label>17.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Zhou</surname> <given-names>W</given-names></name> <name><surname>Chen</surname> <given-names>Y</given-names></name></person-group>. <article-title>Prevalence and risk factors of work-related musculoskeletal disorders among older hospital cleaners in Wenzhou, China</article-title>. <source>Front Public Health</source>. (<year>2025</year>) <volume>13</volume>:<fpage>1727574</fpage>. doi: <pub-id pub-id-type="doi">10.3389/fpubh.2025.1727574</pub-id>, <pub-id pub-id-type="pmid">41383328</pub-id></mixed-citation></ref>
<ref id="ref18"><label>18.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Ding</surname> <given-names>X</given-names></name> <name><surname>Guan</surname> <given-names>Z</given-names></name> <name><surname>Liu</surname> <given-names>N</given-names></name> <name><surname>Bi</surname> <given-names>M</given-names></name> <name><surname>Ji</surname> <given-names>F</given-names></name> <name><surname>Wang</surname> <given-names>H</given-names></name> <etal/></person-group>. <article-title>Prevalence and risk factors of work-related musculoskeletal disorders among emerging manufacturing workers in Beijing, China</article-title>. <source>Front Med</source>. (<year>2023</year>) <volume>10</volume>:<fpage>1289046</fpage>. doi: <pub-id pub-id-type="doi">10.3389/fmed.2023.1289046</pub-id>, <pub-id pub-id-type="pmid">37901405</pub-id></mixed-citation></ref>
<ref id="ref19"><label>19.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Deng</surname> <given-names>H</given-names></name> <name><surname>He</surname> <given-names>D</given-names></name> <name><surname>Li</surname> <given-names>F</given-names></name></person-group>. <article-title>Factors influencing job burnout and musculoskeletal disorders among coal miners in the Xinjiang Uygur autonomous region</article-title>. <source>Pain Res Manag</source>. (<year>2021</year>) <volume>2021</volume>:<fpage>6629807</fpage>. doi: <pub-id pub-id-type="doi">10.1155/2021/6629807</pub-id>, <pub-id pub-id-type="pmid">33628352</pub-id></mixed-citation></ref>
<ref id="ref20"><label>20.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Robinson</surname> <given-names>T</given-names></name> <name><surname>Sussell</surname> <given-names>A</given-names></name> <name><surname>Scott</surname> <given-names>K</given-names></name> <name><surname>Poplin</surname> <given-names>G</given-names></name></person-group>. <article-title>Health conditions among male Workers in Mining and Other Industries Reliant on manual labor occupations: National Health Interview Survey, 2007-2018</article-title>. <source>Am J Ind Med</source>. (<year>2023</year>) <volume>66</volume>:<fpage>692</fpage>&#x2013;<lpage>704</lpage>. doi: <pub-id pub-id-type="doi">10.1002/ajim.23483</pub-id>, <pub-id pub-id-type="pmid">37132409</pub-id></mixed-citation></ref>
<ref id="ref21"><label>21.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Leite</surname> <given-names>W</given-names></name> <name><surname>Ara&#x00FA;jo</surname> <given-names>A</given-names></name> <name><surname>Norte da Silva</surname> <given-names>JM</given-names></name> <name><surname>Gontijo</surname> <given-names>LA</given-names></name> <name><surname>Vieira</surname> <given-names>EMA</given-names></name> <name><surname>Lopes de Souza</surname> <given-names>E</given-names></name> <etal/></person-group>. <article-title>Risk factors for work-related musculoskeletal disorders among Workers in the Footwear Industry: a cross-sectional study</article-title>. <source>Int J Occup Saf Ergon</source>. (<year>2021</year>) <volume>27</volume>:<fpage>393</fpage>&#x2013;<lpage>409</lpage>. doi: <pub-id pub-id-type="doi">10.1080/10803548.2019.1579966</pub-id>, <pub-id pub-id-type="pmid">30735099</pub-id></mixed-citation></ref>
<ref id="ref22"><label>22.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Yang</surname> <given-names>F</given-names></name> <name><surname>Di</surname> <given-names>N</given-names></name> <name><surname>Guo</surname> <given-names>WW</given-names></name> <name><surname>Ding</surname> <given-names>WB</given-names></name> <name><surname>Jia</surname> <given-names>N</given-names></name> <name><surname>Zhang</surname> <given-names>H</given-names></name> <etal/></person-group>. <article-title>The prevalence and risk factors of work related musculoskeletal disorders among electronics manufacturing workers: a cross-sectional analytical study in China</article-title>. <source>BMC Public Health</source>. (<year>2023</year>) <volume>23</volume>:<fpage>10</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s12889-022-14952-6</pub-id>, <pub-id pub-id-type="pmid">36597111</pub-id></mixed-citation></ref>
<ref id="ref23"><label>23.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Ribas</surname> <given-names>TM</given-names></name> <name><surname>Teodori</surname> <given-names>RM</given-names></name> <name><surname>Mescolotto</surname> <given-names>FF</given-names></name> <name><surname>Montebelo</surname> <given-names>MIL</given-names></name> <name><surname>Baruki</surname> <given-names>SBS</given-names></name> <name><surname>Pazzianotto-Forti</surname> <given-names>EM</given-names></name></person-group>. <article-title>Impact of physical activity levels on musculoskeletal symptoms and absenteeism of Workers of a Metallurgical Company</article-title>. <source>Rev Bras Med Trab</source>. (<year>2021</year>) <volume>18</volume>:<fpage>425</fpage>&#x2013;<lpage>33</lpage>. doi: <pub-id pub-id-type="doi">10.47626/1679-4435-2020-572</pub-id>, <pub-id pub-id-type="pmid">33688324</pub-id></mixed-citation></ref>
<ref id="ref24"><label>24.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Guan</surname> <given-names>SY</given-names></name> <name><surname>Zheng</surname> <given-names>JX</given-names></name> <name><surname>Sam</surname> <given-names>NB</given-names></name> <name><surname>Xu</surname> <given-names>S</given-names></name> <name><surname>Shuai</surname> <given-names>Z</given-names></name> <name><surname>Pan</surname> <given-names>F</given-names></name></person-group>. <article-title>Global burden and risk factors of musculoskeletal disorders among adolescents and young adults in 204 countries and territories, 1990-2019</article-title>. <source>Autoimmun Rev</source>. (<year>2023</year>) <volume>22</volume>:<fpage>103361</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.autrev.2023.103361</pub-id>, <pub-id pub-id-type="pmid">37230312</pub-id></mixed-citation></ref>
<ref id="ref25"><label>25.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Curtis</surname> <given-names>E</given-names></name> <name><surname>Litwic</surname> <given-names>A</given-names></name> <name><surname>Cooper</surname> <given-names>C</given-names></name> <name><surname>Dennison</surname> <given-names>E</given-names></name></person-group>. <article-title>Determinants of muscle and bone aging</article-title>. <source>J Cell Physiol</source>. (<year>2015</year>) <volume>230</volume>:<fpage>2618</fpage>&#x2013;<lpage>25</lpage>. doi: <pub-id pub-id-type="doi">10.1002/jcp.25001</pub-id>, <pub-id pub-id-type="pmid">25820482</pub-id></mixed-citation></ref>
<ref id="ref26"><label>26.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Kondo</surname> <given-names>T</given-names></name> <name><surname>Nakano</surname> <given-names>Y</given-names></name> <name><surname>Adachi</surname> <given-names>S</given-names></name> <name><surname>Murohara</surname> <given-names>T</given-names></name></person-group>. <article-title>Effects of tobacco smoking on cardiovascular disease</article-title>. <source>Circ J</source>. (<year>2019</year>) <volume>83</volume>:<fpage>1980</fpage>&#x2013;<lpage>5</lpage>. doi: <pub-id pub-id-type="doi">10.1253/circj.CJ-19-0323</pub-id>, <pub-id pub-id-type="pmid">31462607</pub-id></mixed-citation></ref>
<ref id="ref27"><label>27.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Jia</surname> <given-names>N</given-names></name> <name><surname>Zhang</surname> <given-names>M</given-names></name> <name><surname>Zhang</surname> <given-names>H</given-names></name> <name><surname>Ling</surname> <given-names>R</given-names></name> <name><surname>Liu</surname> <given-names>Y</given-names></name> <name><surname>Li</surname> <given-names>G</given-names></name> <etal/></person-group>. <article-title>Prevalence and risk factors analysis for low Back pain among occupational groups in key Industries of China</article-title>. <source>BMC Public Health</source>. (<year>2022</year>) <volume>22</volume>:<fpage>1493</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s12889-022-13730-8</pub-id>, <pub-id pub-id-type="pmid">35931976</pub-id></mixed-citation></ref>
<ref id="ref28"><label>28.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Das</surname> <given-names>B</given-names></name></person-group>. <article-title>Work-related injuries, postural stress, and musculoskeletal disorders among the railway track maintainers in India</article-title>. <source>Toxicol Ind Health</source>. (<year>2020</year>) <volume>36</volume>:<fpage>371</fpage>&#x2013;<lpage>85</lpage>. doi: <pub-id pub-id-type="doi">10.1177/0748233720932815</pub-id>, <pub-id pub-id-type="pmid">32546106</pub-id></mixed-citation></ref>
<ref id="ref29"><label>29.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Yong</surname> <given-names>X</given-names></name> <name><surname>Li</surname> <given-names>F</given-names></name> <name><surname>Ge</surname> <given-names>H</given-names></name> <name><surname>Sun</surname> <given-names>X</given-names></name> <name><surname>Ma</surname> <given-names>X</given-names></name> <name><surname>Liu</surname> <given-names>J</given-names></name></person-group>. <article-title>A cross-sectional epidemiological survey of work-related musculoskeletal disorders and analysis of its influencing factors among coal mine workers in Xinjiang</article-title>. <source>Biomed Res Int</source>. (<year>2020</year>) <volume>2020</volume>:<fpage>3164056</fpage>. doi: <pub-id pub-id-type="doi">10.1155/2020/3164056</pub-id>, <pub-id pub-id-type="pmid">32851062</pub-id></mixed-citation></ref>
<ref id="ref30"><label>30.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Sotrate Gon&#x00E7;alves</surname> <given-names>J</given-names></name> <name><surname>de Oliveira Sato</surname> <given-names>T</given-names></name></person-group>. <article-title>Factors associated with musculoskeletal symptoms and heart rate variability among cleaners &#x2013; cross-sectional study</article-title>. <source>BMC Public Health</source>. (<year>2020</year>) <volume>20</volume>:<fpage>774</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s12889-020-08928-7</pub-id>, <pub-id pub-id-type="pmid">32448172</pub-id></mixed-citation></ref>
<ref id="ref31"><label>31.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Yao</surname> <given-names>T</given-names></name> <name><surname>Chen</surname> <given-names>X</given-names></name> <name><surname>Wang</surname> <given-names>H</given-names></name> <name><surname>Gao</surname> <given-names>C</given-names></name> <name><surname>Chen</surname> <given-names>J</given-names></name> <name><surname>Yi</surname> <given-names>D</given-names></name> <etal/></person-group>. <article-title>Deep evolutionary fusion neural network: a new prediction standard for infectious disease incidence rates</article-title>. <source>BMC Bioinformat</source>. (<year>2024</year>) <volume>25</volume>:<fpage>38</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s12859-023-05621-5</pub-id>, <pub-id pub-id-type="pmid">38262917</pub-id></mixed-citation></ref>
<ref id="ref32"><label>32.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Gao</surname> <given-names>L</given-names></name> <name><surname>Ding</surname> <given-names>Y</given-names></name></person-group>. <article-title>Disease prediction via Bayesian Hyperparameter optimization and ensemble learning</article-title>. <source>BMC Res Notes</source>. (<year>2020</year>) <volume>13</volume>:<fpage>205</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s13104-020-05050-0</pub-id>, <pub-id pub-id-type="pmid">32276658</pub-id></mixed-citation></ref>
<ref id="ref33"><label>33.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Suo</surname> <given-names>X</given-names></name> <name><surname>Huang</surname> <given-names>X</given-names></name> <name><surname>Zhong</surname> <given-names>L</given-names></name> <name><surname>Luo</surname> <given-names>Q</given-names></name> <name><surname>Ding</surname> <given-names>L</given-names></name> <name><surname>Xue</surname> <given-names>F</given-names></name></person-group>. <article-title>Development and validation of a Bayesian network-based model for predicting coronary heart disease risk from electronic health records</article-title>. <source>J Am Heart Assoc</source>. (<year>2024</year>) <volume>13</volume>:<fpage>e029400</fpage>. doi: <pub-id pub-id-type="doi">10.1161/jaha.123.029400</pub-id>, <pub-id pub-id-type="pmid">38156626</pub-id></mixed-citation></ref>
<ref id="ref34"><label>34.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Yu</surname> <given-names>X</given-names></name> <name><surname>Yang</surname> <given-names>Q</given-names></name> <name><surname>Wang</surname> <given-names>D</given-names></name> <name><surname>Li</surname> <given-names>Z</given-names></name> <name><surname>Chen</surname> <given-names>N</given-names></name> <name><surname>Kong</surname> <given-names>DX</given-names></name></person-group>. <article-title>Predicting lung adenocarcinoma disease progression using methylation-correlated blocks and ensemble machine learning classifiers</article-title>. <source>PeerJ</source>. (<year>2021</year>) <volume>9</volume>:<fpage>e10884</fpage>. doi: <pub-id pub-id-type="doi">10.7717/peerj.10884</pub-id>, <pub-id pub-id-type="pmid">33628643</pub-id></mixed-citation></ref>
<ref id="ref35"><label>35.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Kong</surname> <given-names>G</given-names></name> <name><surname>Wu</surname> <given-names>J</given-names></name> <name><surname>Chu</surname> <given-names>H</given-names></name> <name><surname>Yang</surname> <given-names>C</given-names></name> <name><surname>Lin</surname> <given-names>Y</given-names></name> <name><surname>Lin</surname> <given-names>K</given-names></name> <etal/></person-group>. <article-title>Predicting prolonged length of hospital stay for peritoneal Dialysis-treated patients using stacked generalization: model development and validation study</article-title>. <source>JMIR Med Inform</source>. (<year>2021</year>) <volume>9</volume>:<fpage>e17886</fpage>. doi: <pub-id pub-id-type="doi">10.2196/17886</pub-id>, <pub-id pub-id-type="pmid">34009135</pub-id></mixed-citation></ref>
<ref id="ref36"><label>36.</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Luo</surname> <given-names>N</given-names></name> <name><surname>Xu</surname> <given-names>X</given-names></name> <name><surname>Jiang</surname> <given-names>B</given-names></name> <name><surname>Zhang</surname> <given-names>Z</given-names></name> <name><surname>Huang</surname> <given-names>J</given-names></name> <name><surname>Zhang</surname> <given-names>X</given-names></name> <etal/></person-group>. <article-title>Explainable machine learning framework to predict the risk of work-related neck and shoulder musculoskeletal disorders among healthcare professionals</article-title>. <source>Front Public Health</source>. (<year>2024</year>) <volume>12</volume>:<fpage>1414209</fpage>. doi: <pub-id pub-id-type="doi">10.3389/fpubh.2024.1414209</pub-id>, <pub-id pub-id-type="pmid">39228842</pub-id></mixed-citation></ref>
</ref-list>
<fn-group>
<fn fn-type="custom" custom-type="edited-by" id="fn0002">
<p>Edited by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/937500/overview">Michele Carugno</ext-link>, University of Milan, Italy</p>
</fn>
<fn fn-type="custom" custom-type="reviewed-by" id="fn0003">
<p>Reviewed by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1655571/overview">Gianluca Rossetto</ext-link>, San Camillo Hospital (IRCCS), Italy</p>
<p><ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1916447/overview">Aram Halimi</ext-link>, Shahid Beheshti University of Medical Sciences, Iran</p>
</fn>
</fn-group>
</back>
</article>