<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3-mathml3.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:ali="http://www.niso.org/schemas/ali/1.0/" article-type="brief-report" dtd-version="1.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Educ.</journal-id>
<journal-title-group>
<journal-title>Frontiers in Education</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Educ.</abbrev-journal-title>
</journal-title-group>
<issn pub-type="epub">2504-284X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/feduc.2025.1657651</article-id>
<article-version article-version-type="Version of Record" vocab="NISO-RP-8-2008"/>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Brief Research Report</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>Are U.S. graduate curricula ready to prepare social data scientists for the AI era?</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Dong</surname>
<given-names>Yixiao</given-names>
</name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x002A;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/3118434"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Project administration" vocab-term-identifier="https://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="visualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/visualization/">Visualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x0026; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Baral</surname>
<given-names>Deodatta</given-names>
</name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x0026; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Baral</surname>
<given-names>Kushmakar</given-names>
</name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/3130768"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x0026; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
</contrib>
</contrib-group>
<aff id="aff1"><label>1</label><institution>Department of Education, University of California, Santa Barbara</institution>, <city>Santa Barbara</city>, <state>CA</state>, <country country="us">United States</country></aff>
<aff id="aff2"><label>2</label><institution>Department of Research Methods and Information Science, University of Denver</institution>, <city>Denver</city>, <state>CO</state>, <country country="us">United States</country></aff>
<author-notes>
<corresp id="c001"><label>&#x002A;</label>Correspondence: Yixiao Dong, <email xlink:href="mailto:ydong@ucsb.edu">ydong@ucsb.edu</email></corresp>
</author-notes>
<pub-date publication-format="electronic" date-type="pub" iso-8601-date="2026-01-12">
<day>12</day>
<month>01</month>
<year>2026</year>
</pub-date>
<pub-date publication-format="electronic" date-type="collection">
<year>2025</year>
</pub-date>
<volume>10</volume>
<elocation-id>1657651</elocation-id>
<history>
<date date-type="received">
<day>01</day>
<month>07</month>
<year>2025</year>
</date>
<date date-type="rev-recd">
<day>06</day>
<month>12</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>23</day>
<month>12</month>
<year>2025</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2026 Dong, Baral and Baral.</copyright-statement>
<copyright-year>2026</copyright-year>
<copyright-holder>Dong, Baral and Baral</copyright-holder>
<license>
<ali:license_ref start_date="2026-01-12">https://creativecommons.org/licenses/by/4.0/</ali:license_ref>
<license-p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</license-p>
</license>
</permissions>
<abstract>
<p>The evolving skill demands of the data science workforce present unique challenges for individuals trained in the social science disciplines. This study examines the readiness of U.S. graduate programs in preparing social data scientists for the AI era. We collected and analyzed publicly available coursework plans (<italic>n</italic>&#x202F;=&#x202F;97) from graduate programs at research universities in the U.S. that focus on training social data scientists. Required skills for data scientists were identified through a random sample of current job postings (<italic>n</italic>&#x202F;=&#x202F;30) on LinkedIn and cross-validated with findings from the relevant literature. Using Python-based web scraping and text content analysis, we identified the 10 most in-demand skills within the data science industry and conducted a binary coding of whether each program offers coursework relevant to these skills. These 10 binary indicators were subsequently analyzed using Rasch modeling. The results indicate notable gaps between graduate curricula and industry expectations, and also highlight the need to reform graduate education to better prepare social data scientists for the new demands of the AI era.</p>
</abstract>
<kwd-group>
<kwd>artificial intelligence</kwd>
<kwd>coursework</kwd>
<kwd>curriculum gap</kwd>
<kwd>data science</kwd>
<kwd>Rasch modeling</kwd>
<kwd>text analysis</kwd>
<kwd>web-scraping</kwd>
</kwd-group>
<funding-group>
<funding-statement>The author(s) declared that financial support was not received for this work and/or its publication.</funding-statement>
</funding-group>
<counts>
<fig-count count="1"/>
<table-count count="2"/>
<equation-count count="0"/>
<ref-count count="31"/>
<page-count count="6"/>
<word-count count="4795"/>
</counts>
<custom-meta-group>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Higher Education</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="sec1">
<title>Introduction</title>
<p>Consider this question: What skills are needed for a successful career in data science? Twenty years ago, responses would have emphasized data management, research methodology, and statistical modeling expertise. Today, while these skills remain fundamental, the list of skills in people&#x2019;s responses may expand considerably to include machine learning, natural language processing, Python programming, and artificial intelligence (AI) competencies. Data science has flourished in the 21st century (<xref ref-type="bibr" rid="ref8">Donoho, 2017</xref>; <xref ref-type="bibr" rid="ref27">Schwab-McCoy et al., 2021</xref>). The integration of AI techniques is propelling this field to new heights, which has triggered substantial changes in various ways (<xref ref-type="bibr" rid="ref7">Dong, 2025</xref>; <xref ref-type="bibr" rid="ref13">Ho, 2024</xref>; <xref ref-type="bibr" rid="ref20">Liu et al., 2024</xref>; <xref ref-type="bibr" rid="ref21">Luan et al., 2020</xref>; <xref ref-type="bibr" rid="ref23">Min et al., 2024</xref>). Concurrently, the skill sets required for data scientists are shifting, particularly for those trained in traditional social science disciplines (e.g., Educational Statistics, Quantitative Psychology, and Data Analytics for Social Sciences).</p>
<p>Data scientists represent a broad and somewhat heterogeneous population, given their diverse training in disciplines such as social science, medical science, and computer science (<xref ref-type="bibr" rid="ref8">Donoho, 2017</xref>). Programs and curricula in computer science (or engineering schools) are more likely to keep up with rapid advancements, as they are the <italic>native residents</italic> who initiate the development of AI techniques and make early contributions to introducing AI to the data science field. In contrast, those from the social science family rarely have the first-mover advantage and might lag behind new shifts (<xref ref-type="bibr" rid="ref21">Luan et al., 2020</xref>).</p>
<p>In effect, training in social science disciplines is still striving to catch up with the advanced but conventional skill sets demanded prior to the AI boom in the early 2020s. For example, <xref ref-type="bibr" rid="ref9">Everson (2022)</xref> identifies substantial statistical skills gaps for professors within schools of education, and these gaps are evident in both advanced methods (e.g., propensity score matching, structural equation modeling, and item response theory) and software packages (e.g., R, SAS, and Stata) needed for training educational data scientists. The challenges derived from these gaps could be even more significant for those in minority-serving colleges and universities, which tend to have less federal and financial support (<xref ref-type="bibr" rid="ref4">Brown, 2013</xref>). The constantly evolving and dynamic nature of data science has been a major hurdle for faculty teaching up-to-date content (<xref ref-type="bibr" rid="ref27">Schwab-McCoy et al., 2021</xref>). Now, AI is reshaping the landscape in data science, as well as the needs of the associated industrial labor market (<xref ref-type="bibr" rid="ref12">Hijazi and Alfaki, 2020</xref>; <xref ref-type="bibr" rid="ref20">Liu et al., 2024</xref>), which may create new challenges or magnify existing ones for training data scientists in the social science fields.</p>
<sec id="sec2">
<title>Current study</title>
<p>Program curricula are undoubtedly a fundamental component of data science education (<xref ref-type="bibr" rid="ref10">Gundlach and Ward, 2021</xref>; <xref ref-type="bibr" rid="ref11">Hardin et al., 2021</xref>; <xref ref-type="bibr" rid="ref25">Nolan and Temple Lang, 2010</xref>; <xref ref-type="bibr" rid="ref27">Schwab-McCoy et al., 2021</xref>). The present study aims to examine the curriculum readiness of graduate programs in preparing social data scientists for the AI era, that is, to investigate whether current graduate curricula in social science disciplines adequately cover the skills required for data scientists in today&#x2019;s evolving landscape. The objective of this study is not to develop a new measure of curriculum readiness, which would typically require comprehensive psychometric validation (e.g., <xref ref-type="bibr" rid="ref1">Boateng et al., 2018</xref>). Rather, we aimed to generate complementary and additional evidence from a measurement-analog model to address our research goal. Furthermore, identifying potential gaps in existing curricula is a crucial step for advancing data science education (<xref ref-type="bibr" rid="ref9">Everson, 2022</xref>; <xref ref-type="bibr" rid="ref11">Hardin et al., 2021</xref>), as well as for promoting effective curriculum reforms. Thus, this research also contributes to broader discussions on how to better align graduate training with the evolving demands placed on data scientists in the AI era.</p>
</sec>
</sec>
<sec sec-type="methods" id="sec3">
<title>Methods</title>
<p>The Methods section outlines the sources of curriculum data from graduate programs, data collection procedures (e.g., web scraping), and a description of the main analyses (i.e., text analysis and Rasch modeling) employed in the current study.</p>
<sec id="sec4">
<title>Data sources and collection procedures</title>
<p>To address the research purpose, we collected data from two sources: (1) web-based curricula data and (2) skill requirement data for data scientists in the AI era, drawn from job postings.</p>
<p>For the curricula data, we gathered all publicly available Coursework Plans (CWPs, <italic>n</italic>&#x202F;=&#x202F;97) from U.S. universities&#x2019; graduate programs aimed at training social data scientists. These programs included Quantitative Psychology, Measurement and Quantitative Methods, Educational Statistics, and so forth. These social science programs were chosen for a shared goal of equipping graduates with the quantitative and methodological skills for a career in data science. Additionally, we targeted graduate-level programs at R1 and R2 universities (i.e., those with high or very high research activity). This is because research universities place greater emphasis on graduate-level education, whereas teaching universities typically focus more on undergraduate education. Although graduate training is not strictly required for being a data scientist, graduate programs often offer deeper training in areas such as programming, advanced statistics, or machine learning, which are highly valued in data science (<xref ref-type="bibr" rid="ref15">Jiang and Chen, 2022</xref>).</p>
<p>Based on a recent version of the <xref ref-type="bibr" rid="ref5">Carnegie Classification of Institutions of Higher Education (2024)</xref>, we compiled a list of website URLs for the program CWPs through a manual search. Specifically, two researchers scrutinized each research university&#x2019;s websites to locate qualifying programs and CWPs. After that, web scraping was performed using Python (<xref ref-type="bibr" rid="ref24">Mitchell, 2018</xref>) to extract the content of coursework plans from each URL. The web scraping gathered coursework titles and descriptions, skill emphases, and training goals of programs from each website.</p>
<p>For the skill requirement data, we collected the essential or required skills for current data scientists by examining a sample of new job postings in 2024 on LinkedIn. The search terms for locating job postings on LinkedIn included &#x201C;Data Scientist,&#x201D; &#x201C;AI or Artificial Intelligence Research Scientist,&#x201D; and &#x201C;Social Science.&#x201D; In filtering search outcomes, we selected multiple work experience options (&#x201C;Entry,&#x201D; &#x201C;Senior,&#x201D; and &#x201C;Manager&#x201D;) to ensure that positions requiring different levels of data science skill proficiency were represented. The locations of the searched jobs were restricted to the U.S., given the study population. We randomly sampled 30 data scientist job postings, which included industry leaders such as Lockheed Martin, Udemy, Gusto, Deloitte, Google, DoorDash, and UC Health. This sample encompassed organizations from various sectors that may hire data scientists with a social science background, including technology, healthcare, education, and consulting. For each job posting, skill sets (e.g., SQL, Python, and machine learning) were collected and coded based on the specific requirements (e.g., required skills or qualifications) outlined in the job descriptions.</p>
</sec>
<sec id="sec5">
<title>Overview of analysis</title>
<p>The present study primarily utilized content analysis of text through Python (<xref ref-type="bibr" rid="ref26">Sarkar, 2016</xref>), followed by a Rasch analysis of the extracted information and recoded indicators representing curriculum readiness for training social data scientists. First, we examined the frequency of keywords about skills from 30 online data science job postings on LinkedIn. These frequencies highlighted the skills currently demanded or preferred by employers in the U.S. data science industry. Subsequently, using the compiled list of 10 key skills, another text analysis was implemented to analyze the CWP content of the 97 graduate programs in social data science to identify gaps between industry requirements and graduate training. Each CWP was coded via Python following a dichotomous coding scheme to indicate whether each identified skill was reflected in the program&#x2019;s coursework (1&#x202F;=&#x202F;at least one course containing keywords matching the skill; 0&#x202F;=&#x202F;the skill is not reflected in any coursework).</p>
<p>Next, we entered the indicators into a dichotomous Rasch model to quantify the curriculum readiness of each program and to examine the alignment between current social data science graduate curricula and industry demands. The current study does not aim to comprehensively develop or validate a measure via Rasch modeling; however, certain Rasch analysis results (e.g., Wright maps; <xref ref-type="bibr" rid="ref3">Boone et al., 2014</xref>) can effectively reveal and visualize potential skill gaps between graduate training and industry needs. In this study, three Rasch analyses, including unidimensionality, item fit, and construct coverage (i.e., Wright map), were conducted using <italic>Winsteps 5.3.1</italic> (<xref ref-type="bibr" rid="ref18">Linacre, 2022</xref>). It is important to note that all CWPs were collected and analyzed by the summer of 2024, by which time all graduate programs were expected to have released their coursework for the most recent academic year (i.e., 2024&#x2013;2025).</p>
</sec>
</sec>
<sec sec-type="results" id="sec6">
<title>Results</title>
<p>Here, we first present descriptive findings that identify the key skills required for social data scientists in the AI age and assess how well these skills are covered in the analyzed social science graduate curricula. Rasch modeling results are then provided to further demonstrate the gaps between current industry needs and the skills taught in social science graduate programs for training data scientists.</p>
<sec id="sec7">
<title>Demanded skills of data scientists in the AI age</title>
<p>A total of ten key skills were identified from job postings: machine learning (including deep learning), Bayesian analysis, cloud computing, artificial intelligence, statistics, algorithms, programming, Python, SQL, and research. This list was also cross-validated with skills suggested in the literature for data science (e.g., <xref ref-type="bibr" rid="ref14">Ismail and Abidin, 2016</xref>; <xref ref-type="bibr" rid="ref17">Li et al., 2021</xref>) to ensure its coverage and representativeness. These skills predominantly include specialized technical and programming skills such as Python, deep learning, machine learning, and artificial intelligence, as well as general research and statistics skills valued in traditional social data scientist training. The results highlight the high demand for technical skills among social data scientists (<xref ref-type="bibr" rid="ref6">Costa and Santos, 2017</xref>) and reflect the evolving nature of the data science field.</p>
</sec>
<sec id="sec8">
<title>Gaps between industry needs and social science graduate curricula for data scientists</title>
<p><xref ref-type="table" rid="tab1">Table 1</xref> summarizes the number and percentage of programs offering courses that cover each data science skill identified from the analyzed job posts, ranked from the lowest to the highest percentages. The majority of graduate programs offer courses covering content related to research (97.94%) and statistics (86.60%). However, beyond these traditional skills, less than 10% of the programs provide training in more advanced technical skills or tools (e.g., machine learning, algorithms, and cloud computing).</p>
<table-wrap position="float" id="tab1">
<label>Table 1</label>
<caption>
<p>Number and percentage of programs offering courses that cover each data science skill.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th>Data science skill</th>
<th align="center" valign="top">
<italic>n</italic>
</th>
<th align="center" valign="top">Percentages</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top">Cloud computing</td>
<td align="center" valign="top">0</td>
<td align="center" valign="top">0.00%</td>
</tr>
<tr>
<td align="left" valign="top">SQL</td>
<td align="center" valign="top">1</td>
<td align="center" valign="top">1.03%</td>
</tr>
<tr>
<td align="left" valign="top">Artificial intelligence</td>
<td align="center" valign="top">2</td>
<td align="center" valign="top">2.06%</td>
</tr>
<tr>
<td align="left" valign="top">Algorithms</td>
<td align="center" valign="top">2</td>
<td align="center" valign="top">2.06%</td>
</tr>
<tr>
<td align="left" valign="top">Python</td>
<td align="center" valign="top">4</td>
<td align="center" valign="top">4.12%</td>
</tr>
<tr>
<td align="left" valign="top">Machine learning</td>
<td align="center" valign="top">6</td>
<td align="center" valign="top">6.19%</td>
</tr>
<tr>
<td align="left" valign="top">Bayesian analysis</td>
<td align="center" valign="top">6</td>
<td align="center" valign="top">6.19%</td>
</tr>
<tr>
<td align="left" valign="top">Programming</td>
<td align="center" valign="top">8</td>
<td align="center" valign="top">8.25%</td>
</tr>
<tr>
<td align="left" valign="top">Statistics</td>
<td align="center" valign="top">84</td>
<td align="center" valign="top">86.60%</td>
</tr>
<tr>
<td align="left" valign="top">Research</td>
<td align="center" valign="top">95</td>
<td align="center" valign="top">97.94%</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>A total skill-coverage score was calculated for each program based on the 10 dichotomously coded skill variables (i.e., whether or not each of the 10 skills was covered by each program). The total score had a possible range from 0 to 10, with lower course-skill coverage scores indicating a more severe misalignment between program training and industrial demands. Among the 97 programs, the mean score was 2.13 out of 10 (<italic>SD</italic>&#x202F;=&#x202F;0.78), with a median of 2, indicating that most programs&#x2019; current coursework covers only a limited number of skills (typically traditional research and statistics skills) required for data scientists in the AI era.</p>
</sec>
<sec id="sec9">
<title>Psychometric evidence and implications from Rasch modeling</title>
<p>In addition to the descriptive statistics presented above, Rasch modeling was applied to quantify and investigate the curriculum readiness of each program for training social data scientists, using nine of the 10 dichotomous skillset indicators. The &#x201C;cloud computing&#x201D; indicator was excluded from the analysis because it showed no variance&#x2014;no program involved in this study offered coursework covering this particular skill.</p>
<p>We first examined the dimensionality of the curriculum readiness items through a principal components analysis of residuals (PCAR). The Rasch dimension accounted for 86.1% of the variance in the observations, while the first contrast in the residuals (i.e., the largest secondary dimension) had a relatively small eigenvalue of 2.78 and explained only 4.3% of the variance. This indicates that the Rasch dimension explained the overwhelming majority of variance in the data, and including a secondary dimension would contribute minimally to explaining additional variance. Collectively, these results provide strong evidence of the unidimensionality of the measure (<xref ref-type="bibr" rid="ref19">Linacre, 2025</xref>).</p>
<p><xref ref-type="table" rid="tab2">Table 2</xref> summarizes the mean square (MNSQ) and standardized (ZSTD) item fit statistics. The &#x201C;Research&#x201D; indicator exhibited an outfit MNSQ of 9.9 and a ZSTD of 9.91, both of which substantially exceed the typical acceptable fit range (e.g., MNSQ between 0.6 and 1.4; <xref ref-type="bibr" rid="ref31">Wright and Linacre, 1994</xref>; ZSTD between &#x2212;2 and 2; <xref ref-type="bibr" rid="ref2">Bond and Fox, 2015</xref>). The misfit of the &#x201C;Research&#x201D; indicator suggests that it is not an appropriate item for representing curriculum readiness in the context of AI data science training. This is likely because nearly all collected graduate programs offer research-related coursework, making it ineffective at differentiating program-level readiness.</p>
<table-wrap position="float" id="tab2">
<label>Table 2</label>
<caption>
<p>Summary of item fit statistics.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top" rowspan="2">Items</th>
<th align="center" valign="top" colspan="2">INFIT</th>
<th align="center" valign="top" colspan="2">OUTFIT</th>
</tr>
<tr>
<th align="center" valign="top">MNSQ</th>
<th align="center" valign="top">ZSTD</th>
<th align="center" valign="top">MNSQ</th>
<th align="center" valign="top">ZSTD</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="bottom">Research</td>
<td align="char" valign="bottom" char=".">1.13</td>
<td align="char" valign="bottom" char=".">0.41</td>
<td align="char" valign="bottom" char=".">9.9</td>
<td align="char" valign="bottom" char=".">9.91</td>
</tr>
<tr>
<td align="left" valign="bottom">Bayesian analysis</td>
<td align="char" valign="bottom" char=".">1.24</td>
<td align="char" valign="bottom" char=".">0.9</td>
<td align="char" valign="bottom" char=".">0.28</td>
<td align="char" valign="bottom" char=".">&#x2212;0.46</td>
</tr>
<tr>
<td align="left" valign="bottom">Artificial intelligence</td>
<td align="char" valign="bottom" char=".">1.22</td>
<td align="char" valign="bottom" char=".">0.55</td>
<td align="char" valign="bottom" char=".">0.34</td>
<td align="char" valign="bottom" char=".">&#x2212;0.77</td>
</tr>
<tr>
<td align="left" valign="bottom">SQL</td>
<td align="char" valign="bottom" char=".">1.04</td>
<td align="char" valign="bottom" char=".">0.34</td>
<td align="char" valign="bottom" char=".">0.14</td>
<td align="char" valign="bottom" char=".">&#x2212;2.12</td>
</tr>
<tr>
<td align="left" valign="bottom">Programming</td>
<td align="char" valign="bottom" char=".">1.01</td>
<td align="char" valign="bottom" char=".">0.13</td>
<td align="char" valign="bottom" char=".">0.23</td>
<td align="char" valign="bottom" char=".">&#x2212;0.9</td>
</tr>
<tr>
<td align="left" valign="bottom">Machine learning</td>
<td align="char" valign="bottom" char=".">0.83</td>
<td align="char" valign="bottom" char=".">&#x2212;0.48</td>
<td align="char" valign="bottom" char=".">0.18</td>
<td align="char" valign="bottom" char=".">&#x2212;0.5</td>
</tr>
<tr>
<td align="left" valign="bottom">Algorithms</td>
<td align="char" valign="bottom" char=".">0.7</td>
<td align="char" valign="bottom" char=".">&#x2212;0.37</td>
<td align="char" valign="bottom" char=".">0.09</td>
<td align="char" valign="bottom" char=".">&#x2212;1.62</td>
</tr>
<tr>
<td align="left" valign="bottom">Python</td>
<td align="char" valign="bottom" char=".">0.67</td>
<td align="char" valign="bottom" char=".">&#x2212;0.89</td>
<td align="char" valign="bottom" char=".">0.11</td>
<td align="char" valign="bottom" char=".">&#x2212;0.74</td>
</tr>
<tr>
<td align="left" valign="bottom">Statistics</td>
<td align="char" valign="bottom" char=".">0.34</td>
<td align="char" valign="bottom" char=".">&#x2212;1.79</td>
<td align="char" valign="bottom" char=".">0.09</td>
<td align="char" valign="bottom" char=".">&#x2212;2.45</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>We further examined the alignment between graduate curricula and industry skill demands using a Wright map (see <xref ref-type="fig" rid="fig1">Figure 1</xref>). The curriculum readiness level of programs was placed on the left side of the continuum, while the difficulty levels of the nine skill indicators were plotted on the right. Within the current research context, a more difficult skill indicator generally indicates that programs are less likely to offer coursework covering that skill. From <xref ref-type="fig" rid="fig1">Figure 1</xref>, most skill indicators (all except &#x201C;Statistics&#x201D; and &#x201C;Research&#x201D;) cluster near the upper range of the continuum, between +1.5 and +4 logits. In contrast, programs are concentrated toward the lower end, around the &#x2212;3.5 logit position. These results echo the preliminary descriptive findings and further confirm the existence of a substantial gap between the skills taught in U.S. social science graduate curricula and those demanded by data science industry jobs. Although the general misalignment was evident, several programs demonstrated better alignment. For example, the &#x201C;Statistics/Machine Learning Joint PhD&#x201D; program at Carnegie Mellon University (CMU) was positioned near +3 logits at the high end of the continuum. The program&#x2019;s CWP covers six of the ten outlined skills and has shown the closest alignment between its curriculum and industry demands among the 97 programs analyzed. This finding suggests that a joint training model that integrates social science and computer science could be an innovative and effective strategy for preparing social data scientists in the AI era.</p>
<fig position="float" id="fig1">
<label>Figure 1</label>
<caption>
<p>Wright map of curriculum readiness for preparing social data scientists in the AI era.</p>
</caption>
<graphic xlink:href="feduc-10-1657651-g001.tif" mimetype="image" mime-subtype="tiff">
<alt-text content-type="machine-generated">A vertical item-person map that plots the distribution of difficulty levels for the nine skill indicators and the curriculum readiness level of graduate programs. Skills include SQL, AI, Python, ML (Machine Learning), Bayes, Programming, Statistics, Algorithms, and Research. Measures range from four to negative eleven logits. Each hash represents five programs, and each dot represents one to four programs.</alt-text>
</graphic>
</fig>
</sec>
</sec>
<sec sec-type="discussion" id="sec10">
<title>Discussion</title>
<p>Based on the results above, we discuss the observed misalignment between academic preparation and industry demands in social data science and elaborate on several possible pathways to narrow this gap. The limitations and future directions of the current work are also included in this section.</p>
<sec id="sec11">
<title>The growing misalignment</title>
<p>When we look back at the long-standing conversations around academic preparation versus industry demands (e.g., <xref ref-type="bibr" rid="ref9">Everson, 2022</xref>; <xref ref-type="bibr" rid="ref29">Stone et al., 2009</xref>; <xref ref-type="bibr" rid="ref30">Trauth et al., 1993</xref>), gaps seem to be inevitable. However, the misalignment between social data scientist curricula and industrial demands observed in the current study appears to be more substantial than usual. Graduate programs are expected to provide foundational learning opportunities to help students build expertise in data science. Unfortunately, the skill gap was dramatically large and appeared not to be feasibly bridged through work experience alone, as most programs do not offer emerging skills (e.g., machine learning, cloud computing, and programming) required by the data science labor market in the current AI era. This might result in employment challenges for graduates, as well as raise concerns about the value of current higher education.</p>
<p>Moreover, the actual gap could be larger than what the present work observed for two reasons. First, it is a stringent assumption to expect all graduates to master the skills by just taking a course that covers relevant content. Curricula are fundamental but insufficient for students to build expertise in data science, especially in the age of AI (<xref ref-type="bibr" rid="ref28">Spanjaard et al., 2018</xref>). Additionally, the current study investigates the graduate curricula of R1 and R2 universities. When these generally better-resourced institutions in graduate education lag behind, others might struggle even more to provide the necessary training.</p>
<p>The arrival of AI has clearly played a role in enlarging this gap. AI gained more popularity with the prevalent use of ChatGPT in 2022, but it has permeated data science research and practice (<xref ref-type="bibr" rid="ref7">Dong, 2025</xref>) and impacted the industrial labor market (<xref ref-type="bibr" rid="ref20">Liu et al., 2024</xref>) for decades. As Liu et al. highlighted, since 2010, there has been a growing emphasis on &#x201C;hard&#x201D; technical skills within AI-related data scientist roles. The current study echoes this finding, showing that technical skills are highly demanded. Therefore, addressing this gap, especially in the area of hard skills, is essential for graduates to land jobs in the data science industry.</p>
</sec>
<sec id="sec12">
<title>To narrow the gap: curricula reform or training mode reform?</title>
<p>To narrow the gap, reforming graduate curricula to better align with industrial needs seems to be a necessary step. However, this task could be challenging if we only seek solutions within social science disciplines. College faculty are the main agents to deliver curricula. As <xref ref-type="bibr" rid="ref9">Everson (2022)</xref> noted, even the current faculty in social science commonly struggle with catching up on programming skills and have high demands for related professional development. A shortcut could be hiring new faculty with developed AI expertise (or with computer science backgrounds), but the immediate hiring of new faculty does not seem to be a viable strategy for every university. The existing tenure track system makes faculty turnover slower than in industrial or corporate sectors, which means most programs could take years or decades to accomplish a faculty iteration. By that time, dynamic industrial demands would have shifted again.</p>
<p>Then, reforming the mode of program training could be a more promising path to narrow the identified gap (<xref ref-type="bibr" rid="ref22">Maassen and Cloete, 2006</xref>). The direction of reform may integrate interdisciplinary and technical training by collaborating with other schools (e.g., schools of engineering) that already have experts and talents in AI-related skills. The CMU joint PhD program, which offers students in social science both traditional statistical coursework and technical machine learning content, could be a good example. More importantly, such a mode might be practically scalable because it primarily reorganizes and reconciles already existing resources within a university. In addition to formalizing a joint program, incorporating individualized elective or cognate courses from other disciplines into students&#x2019; CWPs can be an alternative but more flexible strategy. Notably, such an approach often requires more advising support to help students identify suitable courses for their skill development. Meanwhile, it is generally recommended to integrate practical or experiential learning opportunities into programs to further align academic preparation with industry demands (<xref ref-type="bibr" rid="ref16">Kolb, 2014</xref>). Such changes may collectively improve graduates&#x2019; employability and readiness and ensure that data science programs in social science disciplines remain competitive in the AI era.</p>
</sec>
<sec id="sec13">
<title>Limitations and future directions</title>
<p>Given the samples of graduate programs and job posts, research conclusions are limited to social science graduate programs and the social data science industry in the U.S. Future research may examine the generalizability of the study findings in a global setting where non-U.S. graduate programs and job markets are included in the analyses. In particular, it would be beneficial to increase the number of job posts analyzed. The current study used Python-based text analysis to efficiently analyze course webpages and job posts, which may limit the interpretive depth of available data. Certain research findings (e.g., the skill demands of industry and program training coverage) warrant cross-validation through further investigation, such as in-depth interviews with industry leaders or employers in the data science field regarding their specific skill demands for data scientist employees and their perspectives on how to better align graduate training in social science with industry needs. Additionally, the keyword matching approach applied in the current work may assess the course coverage of skills but could be less effective in understanding the depth of training for each skill. Some skills (e.g., AI literacy) cannot be adequately represented or captured by one or two keywords. Future research should consider developing more sophisticated coding schemes to capture related skills based on broader textual contexts.</p>
</sec>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="sec14">
<title>Data availability statement</title>
<p>The datasets presented in this study can be found in online repositories. The names of the repository/repositories and accession number(s) can be found at: <ext-link xlink:href="https://osf.io/vmwzq/" ext-link-type="uri">https://osf.io/vmwzq/</ext-link>.</p>
</sec>
<sec sec-type="author-contributions" id="sec15">
<title>Author contributions</title>
<p>YD: Project administration, Visualization, Formal analysis, Methodology, Resources, Investigation, Conceptualization, Writing &#x2013; review &#x0026; editing, Supervision, Software, Writing &#x2013; original draft. DB: Investigation, Software, Writing &#x2013; review &#x0026; editing, Writing &#x2013; original draft, Formal analysis, Validation, Data curation. KB: Software, Investigation, Writing &#x2013; review &#x0026; editing, Writing &#x2013; original draft, Data curation, Methodology.</p>
</sec>
<sec sec-type="COI-statement" id="sec16">
<title>Conflict of interest</title>
<p>The author(s) declared that this work was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="ai-statement" id="sec17">
<title>Generative AI statement</title>
<p>The author(s) declared that Generative AI was used in the creation of this manuscript. Tools for copy-editing this paper (e.g., Grammarly) may utilize generative AI engines; however, no generative AI applications were used to produce any original content in this paper.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p>
</sec>
<sec sec-type="disclaimer" id="sec18">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ref-list>
<title>References</title>
<ref id="ref1"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Boateng</surname><given-names>G. O.</given-names></name> <name><surname>Neilands</surname><given-names>T. B.</given-names></name> <name><surname>Frongillo</surname><given-names>E. A.</given-names></name> <name><surname>Melgar-Qui&#x00F1;onez</surname><given-names>H. R.</given-names></name> <name><surname>Young</surname><given-names>S. L.</given-names></name></person-group> (<year>2018</year>). <article-title>Best practices for developing and validating scales for health, social, and behavioral research: a primer</article-title>. <source>Front. Public Health</source> <volume>6</volume>:<fpage>149</fpage>. doi: <pub-id pub-id-type="doi">10.3389/fpubh.2018.00149</pub-id>, <pub-id pub-id-type="pmid">29942800</pub-id></mixed-citation></ref>
<ref id="ref2"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Bond</surname><given-names>T. G.</given-names></name> <name><surname>Fox</surname><given-names>C. M.</given-names></name></person-group> (<year>2015</year>). <source>Applying the Rasch Model: Fundamental Measurement in the Human Sciences (3<sup>rd</sup> edition)</source>: <publisher-name>Psychology Press</publisher-name>.</mixed-citation></ref>
<ref id="ref3"><mixed-citation publication-type="other"><person-group person-group-type="author"><name><surname>Boone</surname><given-names>W. J.</given-names></name> <name><surname>Staver</surname><given-names>J. R.</given-names></name> <name><surname>Yale</surname><given-names>M. S.</given-names></name></person-group> (<year>2014</year>). &#x201C;<article-title>Wright maps: first steps</article-title>&#x201D; in <source>Rasch Analysis in the Human Sciences</source>. eds. <person-group person-group-type="editor"><name><surname>Boone</surname><given-names>W. J.</given-names></name> <name><surname>Staver</surname><given-names>J. R.</given-names></name> <name><surname>Yale</surname><given-names>M. S.</given-names></name></person-group>, <fpage>111</fpage>&#x2013;<lpage>136</lpage>.</mixed-citation></ref>
<ref id="ref4"><mixed-citation publication-type="other"><person-group person-group-type="author"><name><surname>Brown</surname><given-names>M. C.</given-names></name></person-group> II. (<year>2013</year>). <article-title>The declining significance of historically black colleges and universities: relevance, reputation, and reality in Obamamerica</article-title>. <source>J. Negro Educ.</source>, <volume>82</volume>, <fpage>3</fpage>&#x2013;<lpage>19</lpage>. doi: <pub-id pub-id-type="doi">10.7709/jnegroeducation.82.1.0003</pub-id></mixed-citation></ref>
<ref id="ref5"><mixed-citation publication-type="other"><person-group person-group-type="author"><collab id="coll1">Carnegie Classification of Institutions of Higher Education</collab></person-group>. <year>2024</year>. <article-title>Carnegie classifications</article-title>. <source>The Carnegie Foundation for the Advancement of Teaching</source>. Available online at: <ext-link xlink:href="https://carnegieclassifications.acenet.edu/" ext-link-type="uri">https://carnegieclassifications.acenet.edu/</ext-link></mixed-citation></ref>
<ref id="ref6"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Costa</surname><given-names>C.</given-names></name> <name><surname>Santos</surname><given-names>M. Y.</given-names></name></person-group> (<year>2017</year>). <article-title>The data scientist profile and its representativeness in the European e-competence framework and the skills framework for the information age</article-title>. <source>Int. J. Inf. Manag.</source> <volume>37</volume>, <fpage>726</fpage>&#x2013;<lpage>734</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.ijinfomgt.2017.07.010</pub-id></mixed-citation></ref>
<ref id="ref7"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Dong</surname><given-names>Y.</given-names></name></person-group> (<year>2025</year>). <article-title>Pre-uniform measures in the artificial intelligence era</article-title>. <source>Curr. Psychol.</source> <volume>44</volume>, <fpage>7919</fpage>&#x2013;<lpage>7933</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s12144-025-07374-1</pub-id></mixed-citation></ref>
<ref id="ref8"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Donoho</surname><given-names>D.</given-names></name></person-group> (<year>2017</year>). <article-title>50 years of data science</article-title>. <source>J. Comput. Graph. Stat.</source> <volume>26</volume>, <fpage>745</fpage>&#x2013;<lpage>766</lpage>. doi: <pub-id pub-id-type="doi">10.1080/10618600.2017.1384734</pub-id></mixed-citation></ref>
<ref id="ref9"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Everson</surname><given-names>K. C.</given-names></name></person-group> (<year>2022</year>). <article-title>Statistical skills gaps of professors of education at U.S. universities and HBCUs</article-title>. <source>J. Stat. Data Sci. Educ.</source> <volume>30</volume>, <fpage>45</fpage>&#x2013;<lpage>53</lpage>. doi: <pub-id pub-id-type="doi">10.1080/26939169.2022.2034488</pub-id></mixed-citation></ref>
<ref id="ref10"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Gundlach</surname><given-names>E.</given-names></name> <name><surname>Ward</surname><given-names>M. D.</given-names></name></person-group> (<year>2021</year>). <article-title>The data mine: enabling data science across the curriculum</article-title>. <source>J. Stat. Data Sci. Educ.</source> <volume>29</volume>, <fpage>S74</fpage>&#x2013;<lpage>S82</lpage>. doi: <pub-id pub-id-type="doi">10.1080/10691898.2020.1848484</pub-id></mixed-citation></ref>
<ref id="ref11"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Hardin</surname><given-names>J.</given-names></name> <name><surname>Horton</surname><given-names>N. J.</given-names></name> <name><surname>Nolan</surname><given-names>D.</given-names></name> <name><surname>Lang</surname><given-names>D. T.</given-names></name></person-group> (<year>2021</year>). <article-title>Computing in the statistics curricula: a 10-year retrospective</article-title>. <source>J. Stat. Data Sci. Educ.</source> <volume>29</volume>, <fpage>S4</fpage>&#x2013;<lpage>S6</lpage>. doi: <pub-id pub-id-type="doi">10.1080/10691898.2020.1862609</pub-id></mixed-citation></ref>
<ref id="ref12"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Hijazi</surname><given-names>R.</given-names></name> <name><surname>Alfaki</surname><given-names>I.</given-names></name></person-group> (<year>2020</year>). <article-title>Reforming undergraduate statistics education in the Arab world in the era of information</article-title>. <source>J. Stat. Educ.</source> <volume>28</volume>, <fpage>75</fpage>&#x2013;<lpage>88</lpage>. doi: <pub-id pub-id-type="doi">10.1080/10691898.2019.1705943</pub-id></mixed-citation></ref>
<ref id="ref13"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Ho</surname><given-names>A. D.</given-names></name></person-group> (<year>2024</year>). <article-title>Artificial intelligence and educational measurement: opportunities and threats</article-title>. <source>J. Educ. Behav. Stat.</source> <volume>49</volume>, <fpage>715</fpage>&#x2013;<lpage>722</lpage>. doi: <pub-id pub-id-type="doi">10.3102/10769986241248771</pub-id></mixed-citation></ref>
<ref id="ref14"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Ismail</surname><given-names>N. A.</given-names></name> <name><surname>Abidin</surname><given-names>W. Z.</given-names></name></person-group> (<year>2016</year>). <article-title>Data scientist skills</article-title>. <source>IOSR J. Mob. Comp. Appl.</source> <volume>3</volume>, <fpage>52</fpage>&#x2013;<lpage>61</lpage>. doi: <pub-id pub-id-type="doi">10.9790/0050-03045261</pub-id></mixed-citation></ref>
<ref id="ref15"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Jiang</surname><given-names>H.</given-names></name> <name><surname>Chen</surname><given-names>C.</given-names></name></person-group> (<year>2022</year>). <article-title>Data science skills and graduate certificates: a quantitative text analysis</article-title>. <source>J. Comput. Inf. Syst.</source> <volume>62</volume>, <fpage>463</fpage>&#x2013;<lpage>479</lpage>. doi: <pub-id pub-id-type="doi">10.1080/08874417.2020.1852628</pub-id></mixed-citation></ref>
<ref id="ref16"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Kolb</surname><given-names>D. A.</given-names></name></person-group> (<year>2014</year>). <source>Experiential Learning: Experience as the Source of Learning and Development</source>. <publisher-loc>Upper Saddle River, NJ</publisher-loc>: <publisher-name>FT Press</publisher-name>.</mixed-citation></ref>
<ref id="ref17"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Li</surname><given-names>G.</given-names></name> <name><surname>Yuan</surname><given-names>C.</given-names></name> <name><surname>Kamarthi</surname><given-names>S.</given-names></name> <name><surname>Moghaddam</surname><given-names>M.</given-names></name> <name><surname>Jin</surname><given-names>X.</given-names></name></person-group> (<year>2021</year>). <article-title>Data science skills and domain knowledge requirements in the manufacturing industry: a gap analysis</article-title>. <source>J. Manuf. Syst.</source> <volume>60</volume>, <fpage>692</fpage>&#x2013;<lpage>706</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.jmsy.2021.07.007</pub-id></mixed-citation></ref>
<ref id="ref18"><mixed-citation publication-type="other"><person-group person-group-type="author"><name><surname>Linacre</surname><given-names>J. M.</given-names></name></person-group> <year>2022</year> Winsteps&#x00AE; (version 5.3.1) [Computer software] Winsteps.com</mixed-citation></ref>
<ref id="ref19"><mixed-citation publication-type="other"><person-group person-group-type="author"><name><surname>Linacre</surname><given-names>J. M.</given-names></name></person-group> <year>2025</year> Winsteps Rasch Measurement Computer Program User&#x2019;s Guide Winsteps.com</mixed-citation></ref>
<ref id="ref20"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Liu</surname><given-names>J.</given-names></name> <name><surname>Chen</surname><given-names>K.</given-names></name> <name><surname>Lyu</surname><given-names>W.</given-names></name></person-group> (<year>2024</year>). <article-title>Embracing artificial intelligence in the labour market: the case of statistics</article-title>. <source>Humanit. Soc. Sci. Commun.</source> <volume>11</volume>:<fpage>1112</fpage>. doi: <pub-id pub-id-type="doi">10.1057/s41599-024-03557-6</pub-id></mixed-citation></ref>
<ref id="ref21"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Luan</surname><given-names>H.</given-names></name> <name><surname>Geczy</surname><given-names>P.</given-names></name> <name><surname>Lai</surname><given-names>H.</given-names></name> <name><surname>Gobert</surname><given-names>J.</given-names></name> <name><surname>Yang</surname><given-names>S. J. H.</given-names></name> <name><surname>Ogata</surname><given-names>H.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>Challenges and future directions of big data and artificial intelligence in education</article-title>. <source>Front. Psychol.</source> <volume>11</volume>:<fpage>580820</fpage>. doi: <pub-id pub-id-type="doi">10.3389/fpsyg.2020.580820</pub-id>, <pub-id pub-id-type="pmid">33192896</pub-id></mixed-citation></ref>
<ref id="ref22"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Maassen</surname><given-names>P.</given-names></name> <name><surname>Cloete</surname><given-names>N.</given-names></name></person-group> (<year>2006</year>). <article-title>Global reform trends in higher education</article-title>. <source>Transformation in higher education: Global pressures and local realities</source>. eds. <person-group person-group-type="editor"><name><surname>Cloete</surname><given-names>N.</given-names></name> <name><surname>Maassen</surname><given-names>P.</given-names></name> <name><surname>Fehnel</surname><given-names>R.</given-names></name> <name><surname>Moja</surname><given-names>T.</given-names></name> <name><surname>Gibbon</surname><given-names>T.</given-names></name> <name><surname>Perold</surname><given-names>H.</given-names></name></person-group>. (<publisher-loc>The Netherlands</publisher-loc>: <publisher-name>Springer</publisher-name>).</mixed-citation></ref>
<ref id="ref23"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Min</surname><given-names>J.</given-names></name> <name><surname>Song</surname><given-names>X.</given-names></name> <name><surname>Zheng</surname><given-names>S.</given-names></name> <name><surname>King</surname><given-names>C. B.</given-names></name> <name><surname>Deng</surname><given-names>X.</given-names></name> <name><surname>Hong</surname><given-names>Y.</given-names></name></person-group> (<year>2024</year>). <article-title>Applied statistics in the era of artificial intelligence: a review and vision</article-title>. <source>arXiv</source>. doi: <pub-id pub-id-type="doi">10.48550/arXiv.2412.10331</pub-id></mixed-citation></ref>
<ref id="ref24"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Mitchell</surname><given-names>R.</given-names></name></person-group> (<year>2018</year>). <source>Web Scraping with Python: Collecting More Data from the Modern Web</source>. <publisher-loc>Sebastopol, CA</publisher-loc>: <publisher-name>O'Reilly Media</publisher-name>.</mixed-citation></ref>
<ref id="ref25"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Nolan</surname><given-names>D.</given-names></name> <name><surname>Temple Lang</surname><given-names>D.</given-names></name></person-group> (<year>2010</year>). <article-title>Computing in the statistics curricula</article-title>. <source>Am. Stat.</source> <volume>64</volume>, <fpage>97</fpage>&#x2013;<lpage>107</lpage>. doi: <pub-id pub-id-type="doi">10.1198/tast.2010.09132</pub-id></mixed-citation></ref>
<ref id="ref26"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Sarkar</surname><given-names>D.</given-names></name></person-group> (<year>2016</year>). <source>Text Analytics with Python</source>, vol. <volume>2</volume>. <publisher-loc>New York, NY</publisher-loc>: <publisher-name>Apress</publisher-name>.</mixed-citation></ref>
<ref id="ref27"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Schwab-McCoy</surname><given-names>A.</given-names></name> <name><surname>Baker</surname><given-names>C. M.</given-names></name> <name><surname>Gasper</surname><given-names>R. E.</given-names></name></person-group> (<year>2021</year>). <article-title>Data science in 2020: computing, curricula, and challenges for the next 10 years</article-title>. <source>J. Stat. Data Sci. Educ.</source> <volume>29</volume>, <fpage>S40</fpage>&#x2013;<lpage>S50</lpage>. doi: <pub-id pub-id-type="doi">10.1080/10691898.2020.1851159</pub-id></mixed-citation></ref>
<ref id="ref28"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Spanjaard</surname><given-names>D.</given-names></name> <name><surname>Hall</surname><given-names>T.</given-names></name> <name><surname>Stegemann</surname><given-names>N.</given-names></name></person-group> (<year>2018</year>). <article-title>Experiential learning: helping students to become &#x2018;career-ready&#x2019;</article-title>. <source>Australas. Mark. J.</source> <volume>26</volume>, <fpage>163</fpage>&#x2013;<lpage>171</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.ausmj.2018.04.003</pub-id></mixed-citation></ref>
<ref id="ref29"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Stone</surname><given-names>K. B.</given-names></name> <name><surname>Kaminski</surname><given-names>K.</given-names></name> <name><surname>Gloeckner</surname><given-names>G.</given-names></name></person-group> (<year>2009</year>). <article-title>Closing the gap: education requirements of the 21st century production workforce</article-title>. <source>J. Ind. Teach. Educ.</source> <volume>45</volume>, <fpage>5</fpage>&#x2013;<lpage>33</lpage>.</mixed-citation></ref>
<ref id="ref30"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Trauth</surname><given-names>E. M.</given-names></name> <name><surname>Farwell</surname><given-names>D. W.</given-names></name> <name><surname>Lee</surname><given-names>D.</given-names></name></person-group> (<year>1993</year>). <article-title>The IS expectation gap: industry expectations versus academic preparation</article-title>. <source>MIS Q.</source> <volume>17</volume>:<fpage>293</fpage>. doi: <pub-id pub-id-type="doi">10.2307/249773</pub-id></mixed-citation></ref>
<ref id="ref31"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Wright</surname><given-names>B. D.</given-names></name> <name><surname>Linacre</surname><given-names>J. M.</given-names></name></person-group> (<year>1994</year>). <article-title>Reasonable mean-square fit values</article-title>. <source>Rasch Meas. Trans.</source> <volume>8</volume>, <fpage>370</fpage>&#x2013;<lpage>371</lpage>.</mixed-citation></ref>
</ref-list>
<fn-group>
<fn fn-type="custom" custom-type="edited-by" id="fn0001">
<p>Edited by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1541523/overview">Barbara Jones</ext-link>, Bibliometrica Limited, United Kingdom</p>
</fn>
<fn fn-type="custom" custom-type="reviewed-by" id="fn0002">
<p>Reviewed by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/610799/overview">Francisco Rafael Trejo-Macotela</ext-link>, Universidad Polit&#x00E9;cnica de Pachuca, Mexico</p>
<p><ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1546858/overview">Rany Sam</ext-link>, National University of Battambang, Cambodia</p>
</fn>
</fn-group>
</back>
</article>