<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Public Health</journal-id>
<journal-title>Frontiers in Public Health</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Public Health</abbrev-journal-title>
<issn pub-type="epub">2296-2565</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fpubh.2025.1513744</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Public Health</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Two-stage DRG grouping of cerebral infarction based on comorbidity and complications classification</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name><surname>Zeng</surname> <given-names>Siyu</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Li</surname> <given-names>Lele</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref rid="aff3" ref-type="aff"><sup>3</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/1370628/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Li</surname> <given-names>Jialing</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>He</surname> <given-names>Xiaozhou</given-names></name>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x002A;</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>School of Logistics, Chengdu University of Information Technology</institution>, <addr-line>Chengdu, Sichuan</addr-line>, <country>China</country></aff>
<aff id="aff2"><sup>2</sup><institution>School of Labor and Human Resources, Renmin University of China</institution>, <addr-line>Beijing</addr-line>, <country>China</country></aff>
<aff id="aff3"><sup>3</sup><institution>Institute for Hospital Management of Henan Province</institution>, <addr-line>Zhengzhou</addr-line>, <country>China</country></aff>
<aff id="aff4"><sup>4</sup><institution>School of Management, Hunan University of Technology and Business</institution>, <addr-line>Changsha, Hunan</addr-line>, <country>China</country></aff>
<aff id="aff5"><sup>5</sup><institution>Business School, Sichuan University</institution>, <addr-line>Chengdu, Sichuan</addr-line>, <country>China</country></aff>
<author-notes>
<fn id="fn0001" fn-type="edited-by"><p>Edited by: Fernando Zanela Ar&#x00EA;as, Baylor Scott and White Research Institute, United States</p></fn>
<fn id="fn0002" fn-type="edited-by"><p>Reviewed by: Georgios Tagarakis, Aristotle University of Thessaloniki, Greece</p>
<p>Fani Tsolaki, Aristotle University of Thessaloniki, Greece</p></fn>
<corresp id="c001">&#x002A;Correspondence: Xiaozhou He, <email>xiaozhouhe126@qq.com</email></corresp>
</author-notes>
<pub-date pub-type="epub">
<day>28</day>
<month>04</month>
<year>2025</year>
</pub-date>
<pub-date pub-type="collection">
<year>2025</year>
</pub-date>
<volume>13</volume>
<elocation-id>1513744</elocation-id>
<history>
<date date-type="received">
<day>19</day>
<month>10</month>
<year>2024</year>
</date>
<date date-type="accepted">
<day>21</day>
<month>03</month>
<year>2025</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2025 Zeng, Li, Li and He.</copyright-statement>
<copyright-year>2025</copyright-year>
<copyright-holder>Zeng, Li, Li and He</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<sec id="sec1">
<title>Background</title>
<p>Since 2017, cerebral infarction (CI) has become a leading cause of mortality in China, with rising treatment costs posing significant challenges to the healthcare system. The Diagnosis-Related Groups (DRG) payment system has been recognized as a potential solution to curb rising healthcare expenditures. However, in its implementation, China faces considerable hurdles due to its vast geographical size, regional economic disparities, and heterogeneous disease spectrum.</p>
</sec>
<sec id="sec2">
<title>Objective</title>
<p>This study proposes a novel two-stage grouping method tailored to the local context of western China. The method adaptively accommodates regional variations in disease burden and healthcare resource distribution.</p>
</sec>
<sec id="sec3">
<title>Methods</title>
<p>Using hospitalization data from 111,025 CI patients collected by the Healthcare Security Administration of a western Chinese city between 2016 and 2018 (during the pre-DRG implementation period), we developed a two-stage DRG method. In the first stage, regression analysis identified and prioritized comorbidities and complications that influence medical costs. In the second stage, a decision tree algorithm established standardized classification protocols for DRG grouping, ensuring regional adaptability.</p>
</sec>
<sec id="sec4">
<title>Results</title>
<p>The average hospitalization cost for CI patients was USD$ 1,565, with total expenditures reaching USD$ 170.94&#x202F;million in the target city. With this localized two-stage grouping model, the proportion of groups whose variation, as measured by the coefficient of variation (CV), is below 1 reached 100%, satisfying the technical criteria for DRG categorization. This optimization reduced the number of DRGs from 18 to 4 and increased the proportion of groups with CV &#x003C;0.8 from 67 to 100%, signifying a substantial enhancement in within-group homogeneity compared to the existing grouping method, China Healthcare Security Diagnosis-Related Groups (CHS-DRG).</p>
</sec>
<sec id="sec5">
<title>Conclusion</title>
<p>This study demonstrates the effectiveness of our proposed two-stage method using real data. Implementation of this localized method in the target city could result in potential savings of USD$ 8.59&#x202F;million, surpassing the existing CHS-DRG method. These findings suggest that this adaptive method may be a scalable strategy for resource-limited regions undergoing healthcare system reforms.</p>
</sec>
</abstract>
<kwd-group>
<kwd>diagnosis-related groups</kwd>
<kwd>classification</kwd>
<kwd>comorbidity and complications</kwd>
<kwd>cerebral infarction</kwd>
<kwd>two-stage grouping method</kwd>
</kwd-group>
<counts>
<fig-count count="3"/>
<table-count count="9"/>
<equation-count count="1"/>
<ref-count count="24"/>
<page-count count="12"/>
<word-count count="7475"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Health Economics</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="sec6">
<label>1</label>
<title>Introduction</title>
<p>Cerebrovascular disease is the leading cause of death and disability worldwide (<xref ref-type="bibr" rid="ref1">1</xref>), yet advancements in its treatment have increased medical expenditure. In 2017, China&#x2019;s expenditure on cerebrovascular disease treatment reached USD$ 83.83&#x202F;billion, surpassing all other diseases and accounting for 17% of the nation&#x2019;s total disease treatment expenditure&#x2014;equivalent to 0.66% of GDP (<xref ref-type="bibr" rid="ref2">2</xref>). Cerebral infarction (CI) is the most prevalent cerebrovascular condition, with increasing incidence rates and treatment costs significantly exceeding those of many other diseases. This trend imposes direct financial burdens on patients and families while stressing the basic medical insurance system (<xref ref-type="bibr" rid="ref3">3</xref>). Managing the rapid increase of CI-related healthcare costs has become a critical challenge for China&#x2019;s healthcare system, which is also an urgent issue worldwide (<xref ref-type="bibr" rid="ref4">4</xref>).</p>
<p>The Chinese healthcare department has proactively tackled cost containment through payment reforms. In 2018, Beijing implemented the Diagnosis-Related Groups (DRG) payment system. Building upon this pilot initiative, the China Healthcare Security Diagnosis-Related Groups (CHS-DRG) was formally established in 2019 as the national standard. This establishment marks a significant milestone in the development of China&#x2019;s healthcare financing mechanisms, with immediate expansion to 30 major cities (<xref ref-type="bibr" rid="ref5">5</xref>). This CHS-DRG provides standardized grouping protocols and reimbursement benchmarks, enabling systematic cost control while ensuring the quality of care (<xref ref-type="bibr" rid="ref6">6</xref>). The DRG payment system is expected to alleviate the increasing trend of healthcare expenditure. In this context, CI, characterized by a persistent increase in medical costs, serves as a critical use case for refining the DRG grouping method.</p>
<p>The DRG payment system is one of the most cutting-edge methods in global healthcare finance, becoming increasingly favored for reimbursing hospitals amid rising medical expenditure since its inception in 1983 (<xref ref-type="bibr" rid="ref7">7</xref>, <xref ref-type="bibr" rid="ref8">8</xref>). In a DRG payment system, patients who exhibit analogous clinical profiles and necessitate similar levels of care are categorized under identical case types or &#x2018;groups&#x2019;, ensuring that individuals within the same DRG group consume similar healthcare resources (<xref ref-type="bibr" rid="ref9">9</xref>). Consequently, the medical insurance provider pays money based on the DRG group to which the patient belongs and the hospital bears any costs that exceed the payment standard of the group. This framework encourages hospitals to actively engage in cost management and control. However, CHS-DRGs are developed based on data sourced from China&#x2019;s first-tier cities, with a lack of research addressing the specific needs of less developed cities in the western regions. Given China&#x2019;s vast territorial expanse, the economic disparities, and the diverse disease landscape, a one-size-fits-all approach to DRG implementation is impractical for developing cities (<xref ref-type="bibr" rid="ref2">2</xref>, <xref ref-type="bibr" rid="ref10">10</xref>). The challenge lies in making a DRG grouping scheme adapted to the local condition (<xref ref-type="bibr" rid="ref10">10</xref>).</p>
<p>Several studies have highlighted the pivotal role of comorbidity and complications (CCs) in shaping the DRG grouping strategy (<xref ref-type="bibr" rid="ref10">10</xref>). The method for identifying CCs for the CHS-DRG draws inspiration from the DRG of the United States and Australia. This classification process involves the following two steps:</p>
<p>(1) Initially, CCs are ranked in descending order according to their incidence rate. Those with an incidence rate below 5% are merged into a non-CC type.</p>
<p>(2) Subsequently, after their weights are adjusted, taking into account the hospitalization costs and the age of the patients, CCs are classified into three types: major (MCC), moderate (mCC), and non-CC (<xref ref-type="bibr" rid="ref11">11</xref>).</p>
<p>However, the analysis of the target city&#x2019;s data reveals a notable contrast with the incidence rates of CCs in the CHS-DRG. Given the expansive geographical spread and the resultant variation in the disease spectrum, a unified grouping standard like CHS-DRG may not be well suited to the local region. Therefore, there is an urgent need to adapt CC classification criteria to accommodate the unique healthcare characteristics of different cities, ensuring systematic alignment with local disease patterns.</p>
<p>This study examines the rising trends in medical expenditures and introduces a novel two-stage DRG framework designed to mitigate these costs, focusing specifically on a developing city in western China. Our research is centered on CI, which has been observed to have the most rapid increase in medical expenditures. Based on the collected data, the proposed two-stage method is designed to better align with the local context and disease spectrum. In the first stage of the method, regression analysis is used to classify CCs that occur in the city. In the second stage, decision tree ID3, a machine learning algorithm, is used to group patients with similar medical expenses. The performance of the two-stage method is compared with the grouping method of the CHS-DRG. This study fills a gap in the extant literature by focusing on a developing city and proposing feasible rules for the DRG grouping in different regions according to local conditions.</p>
<p>The rest of this article is organized as follows: The &#x201C;Materials and Methods&#x201D; section introduces the materials and methods necessary for developing the two-stage method. The &#x201C;Results&#x201D; section first presents the grouping results derived from the benchmark method CHS-DRGs and then the step-by-step results of our proposed two-stage model. This section also shows a comprehensive comparison of results obtained through these two approaches. The &#x201C;Results&#x201D; section is followed by &#x201C;Discussion&#x201D; and &#x201C;Conclusion&#x201D; sections. The limitation of this study is discussed in the &#x201C;Conclusion&#x201D; section.</p>
</sec>
<sec sec-type="materials|methods" id="sec7">
<label>2</label>
<title>Materials and methods</title>
<p>The research roadmap is shown in <xref ref-type="fig" rid="fig1">Figure 1</xref>.</p>
<fig position="float" id="fig1">
<label>Figure 1</label>
<caption><p>Research roadmap.</p></caption>
<graphic xlink:href="fpubh-13-1513744-g001.tif"/>
</fig>
<p>(1) The first step was the research preparation, where we introduced the data sources, data processing, and methods applied.</p>
<p>(2) The second step was descriptive statistics on the data of this sample from the aspects of morbidity, hospitalization resource consumption, etc.</p>
<p>(3) The third step was to show our two-stage method and the grouping results. In this step, the CHS-DRG is compared as the benchmark. Thus, the following two substeps are included:</p>
<list list-type="simple">
<list-item><p>(a) First, we applied the existing CHS-DRGs classification criteria to group patient cases collected from the target area, where CCs were classified with the China Healthcare Security-Technical Specification (CTS) (<xref ref-type="bibr" rid="ref12">12</xref>), as shown in <xref rid="SM1" ref-type="supplementary-material">Supplementary Figure A1</xref>.</p></list-item>
<list-item><p>(b) Second, we developed the novel two-stage method:</p></list-item>
</list>
<list list-type="bullet">
<list-item><p>In the first stage, we constructed seven regression models based on seven diagnoses of CCs with other control variables such as age, sex, and insurance type to identify CCs with a significant impact on medical expenses under each diagnosis.</p></list-item>
<list-item><p>In the second stage, we applied a decision tree algorithm to obtain the grouping plan and improve the adaptability of the DRG, which can contribute to better cost control.</p></list-item>
</list>
<p>(4) In the final step, we evaluated the performance of the two-stage method by comparing it with the CHS-DRGs regarding grouping results and the utilization of medical resource consumption.</p>
<sec id="sec8">
<label>2.1</label>
<title>Patient data</title>
<p>The dataset for this research was rigorously collected from the Healthcare Security Administration of the target city (HSAC) in western China. The data span a period of 3&#x202F;years (2016&#x2013;2018), providing a longitudinal perspective on healthcare trends and patterns. The dataset encompasses a substantial sample size of 111,025 inpatient cases with CI (the International Classification of Diseases, Tenth Revision, Clinical Modification [ICD-10] codes I63.1&#x2013;I63.9) as the main diagnosis from 416 hospitals. The original dataset includes 58 variables, including sex, age, length of stay (LOS) in hospital, cost of hospitalization, insurance type, and seven CCs. We claim that the data are non-public, and all experimental protocols have been approved by the HSAC.</p>
</sec>
<sec id="sec9">
<label>2.2</label>
<title>Data cleaning and variable selection</title>
<p>Initially, 111,025 patient cases were collected, with incomplete data excluded during preprocessing. Further refinement excluded extreme cases with LOS over 60&#x202F;days, in line with a previously reported procedure (<xref ref-type="bibr" rid="ref13">13</xref>), resulting in 109,375 cases. Considering the annual medical insurance reimbursement limit of USD$ 22,189 set by the city&#x2019;s policy, cases with hospitalization expenditures exceeding this limit were treated as outliers and excluded, leading to a final refined dataset of 109,314 cases.</p>
<p>Next, in addition to CCs, this study included six control variables resulting from our previous study (<xref ref-type="bibr" rid="ref3">3</xref>): sex, age, LOS, hospital level, insurance type, and payment level.</p>
</sec>
<sec id="sec10">
<label>2.3</label>
<title>Grouping method</title>
<p>CCs have a significant impact on medical expenditures (<xref ref-type="bibr" rid="ref14">14</xref>). An effective classification of CCs is vital to establishing a scientific and reasonable DRG grouping plan (<xref ref-type="bibr" rid="ref15">15</xref>). In the CHS-DRG, CCs with higher incidence rates are ranked higher when classifying CCs. However, CCs with high incidence rates do not always produce high medical expenses. Since the goal of implementing the DRGs is to control medical expenses, CCs should be classified according to their impact on medical expenses. For this purpose, regression analysis was adopted in the first stage of the method.</p>
<p>Regression analysis is a statistical method commonly used to determine whether there is a dependence between two variables, and the degree of dependence can be indicated by the coefficients (<xref ref-type="bibr" rid="ref16">16</xref>). Therefore, the <italic>p</italic>-values of the variables were used to test the significance of CCs. The regression coefficient of significant CCs was used to quantify their impact on medical expenses. Specifically, we constructed seven regression models corresponding to the seven diagnoses on CCs, as suggested by the staff of HSAC that the principal diagnosis, i.e., CI, and seven primary diagnoses on CCs are valuable if the patient has multiple CCs. We analyzed the significance of CCs and obtained the regression coefficients for each model. Those CCs that were significant (<italic>p</italic>&#x202F;&#x003C;&#x202F;0.05) in at least one model were selected and then ranked with their regression coefficients.</p>
<p>The models are described in <xref ref-type="table" rid="tab1">Table 1</xref>, and the seven regression models, indexed by <inline-formula><mml:math id="M1"><mml:mi>i</mml:mi></mml:math></inline-formula> from 1 to 7, are shown in <xref ref-type="disp-formula" rid="EQ1">Equation (1)</xref>:</p>
<disp-formula id="EQ1"><label>(1)</label><mml:math id="M2"><mml:mi>y</mml:mi><mml:mo>=</mml:mo><mml:msubsup><mml:mstyle displaystyle="true"><mml:mo stretchy="true">&#x2211;</mml:mo></mml:mstyle><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:msub><mml:mi>J</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:msubsup><mml:msub><mml:mi>&#x03B2;</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>&#x2217;</mml:mo><mml:msub><mml:mi>x</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>+</mml:mo><mml:mstyle displaystyle="true"><mml:munderover><mml:mo stretchy="true">&#x2211;</mml:mo><mml:mrow><mml:mi>n</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>N</mml:mi></mml:munderover></mml:mstyle><mml:msub><mml:mi>&#x03B3;</mml:mi><mml:mi>n</mml:mi></mml:msub><mml:mo>&#x2217;</mml:mo><mml:msub><mml:mtext>control</mml:mtext><mml:mi>n</mml:mi></mml:msub><mml:mo>+</mml:mo><mml:mi>e</mml:mi><mml:mo>,</mml:mo><mml:mspace width="0.5em"/><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn><mml:mo>,</mml:mo><mml:mo>&#x2026;</mml:mo><mml:mo>,</mml:mo><mml:mn>7</mml:mn></mml:math></disp-formula>
<table-wrap position="float" id="tab1">
<label>Table 1</label>
<caption><p>Description of the regression models.</p></caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top" colspan="3">Input</th>
<th align="center" valign="top" colspan="2">Output</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle">Dependent variable indicating medical expense</td>
<td align="left" valign="middle">Independent variable indicating CCs</td>
<td align="left" valign="middle">Control variable indicating age</td>
<td align="left" valign="middle" rowspan="2">Regression coefficient <inline-formula><mml:math id="M3"><mml:msub><mml:mi>&#x03B2;</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula></td>
<td align="left" valign="middle" rowspan="2"><italic>p</italic>-value of <inline-formula><mml:math id="M4"><mml:msub><mml:mi>x</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula></td>
</tr>
<tr>
<td align="left" valign="middle"><inline-formula><mml:math id="M5"><mml:mi>y</mml:mi></mml:math></inline-formula></td>
<td align="left" valign="middle"><inline-formula><mml:math id="M6"><mml:msub><mml:mi>x</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>&#x2208;</mml:mo><mml:mfenced open="{" close="}" separators=","><mml:mn>0</mml:mn><mml:mn>1</mml:mn></mml:mfenced></mml:math></inline-formula></td>
<td align="left" valign="middle"><inline-formula><mml:math id="M7"><mml:msub><mml:mtext>control</mml:mtext><mml:mi>n</mml:mi></mml:msub></mml:math></inline-formula></td>
</tr>
</tbody>
</table>
</table-wrap>
<p>In these models, the dependent variable <inline-formula><mml:math id="M8"><mml:mi>y</mml:mi></mml:math></inline-formula> represents the medical expense of each patient. The independent variable <inline-formula><mml:math id="M9"><mml:msub><mml:mi>x</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula> corresponds to the <inline-formula><mml:math id="M10"><mml:mi>j</mml:mi></mml:math></inline-formula>th CC in the <inline-formula><mml:math id="M11"><mml:mi>i</mml:mi></mml:math></inline-formula>th diagnosis/model, which is a 0,1-variable indicating whether a patient has this CC. The number of CCs in each diagnosis <inline-formula><mml:math id="M12"><mml:mi>i</mml:mi></mml:math></inline-formula> is denoted as <inline-formula><mml:math id="M13"><mml:msub><mml:mi>J</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:math></inline-formula>. The regression coefficient of <inline-formula><mml:math id="M14"><mml:msub><mml:mi>x</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula> is <inline-formula><mml:math id="M15"><mml:msub><mml:mi>&#x03B2;</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula>. These seven models also include <inline-formula><mml:math id="M16"><mml:mi>N</mml:mi><mml:mo>=</mml:mo><mml:mn>6</mml:mn></mml:math></inline-formula> control variables, <inline-formula><mml:math id="M17"><mml:msub><mml:mtext>control</mml:mtext><mml:mi>n</mml:mi></mml:msub><mml:mspace width="thickmathspace"/><mml:mfenced open="(" close=")"><mml:mrow><mml:mi>n</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn><mml:mo>,</mml:mo><mml:mo>&#x2026;</mml:mo><mml:mo>,</mml:mo><mml:mi>N</mml:mi></mml:mrow></mml:mfenced></mml:math></inline-formula>, representing age and sex, among others, as discussed in the &#x201C;Data cleaning and variable selection&#x201D; section. 
The coefficient associated with <inline-formula><mml:math id="M18"><mml:msub><mml:mtext>control</mml:mtext><mml:mi>n</mml:mi></mml:msub></mml:math></inline-formula> is <inline-formula><mml:math id="M19"><mml:msub><mml:mi>&#x03B3;</mml:mi><mml:mi>n</mml:mi></mml:msub></mml:math></inline-formula>, and <inline-formula><mml:math id="M20"><mml:mi>e</mml:mi></mml:math></inline-formula> is the error term.</p>
<p>The identified CCs were then classified into three types: Type I, Type II, and Type III. For each model, the top 30% of CCs were considered to be major, i.e., MCC; the CCs ranked 30&#x2013;60% were considered moderate, i.e., mCC; and the last 40% were non-CC.</p>
<p>Based on the classification of CCs, patients with different CCs were classified into three types of priorities according to their type of CCs. As shown in <xref ref-type="table" rid="tab2">Table 2</xref>, if a patient has at least one MCC among the seven primary diagnoses, then they are considered the highest priority, that is, type I; if they do not have any MCC but have at least one mCC, then they are classified as type II; otherwise, they belong to type III.</p>
<table-wrap position="float" id="tab2">
<label>Table 2</label>
<caption><p>Patient type based on CCs.</p></caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top" rowspan="2">Patient priority</th>
<th align="center" valign="top" colspan="3">Classification of CCs</th>
</tr>
<tr>
<th align="center" valign="top">MCC</th>
<th align="center" valign="top">mCC</th>
<th align="center" valign="top">Non-CC</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top">Type I (severity)</td>
<td align="center" valign="top"><inline-graphic xlink:href="fpubh-13-1513744-i001.tif"/></td>
<td align="center" valign="top"><inline-graphic xlink:href="fpubh-13-1513744-i002.tif"/></td>
<td align="center" valign="top"><inline-graphic xlink:href="fpubh-13-1513744-i002.tif"/></td>
</tr>
<tr>
<td align="left" valign="top">Type II (general)</td>
<td align="center" valign="top"><inline-graphic xlink:href="fpubh-13-1513744-i003.tif"/></td>
<td align="center" valign="top"><inline-graphic xlink:href="fpubh-13-1513744-i001.tif"/></td>
<td align="center" valign="top"><inline-graphic xlink:href="fpubh-13-1513744-i002.tif"/></td>
</tr>
<tr>
<td align="left" valign="top">Type III (slight)</td>
<td align="center" valign="top"><inline-graphic xlink:href="fpubh-13-1513744-i003.tif"/></td>
<td align="center" valign="top"><inline-graphic xlink:href="fpubh-13-1513744-i003.tif"/></td>
<td align="center" valign="top"><inline-graphic xlink:href="fpubh-13-1513744-i002.tif"/></td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p><inline-graphic xlink:href="fpubh-13-1513744-i001.tif"/>: Has this type of CCs. <inline-graphic xlink:href="fpubh-13-1513744-i003.tif"/>: Does not have this type of CCs. <inline-graphic xlink:href="fpubh-13-1513744-i002.tif"/>: May or may not have this type of CCs.</p>
</table-wrap-foot>
</table-wrap>
<p>After selecting and ranking CCs, the decision tree classifier was applied. The decision tree classifier has been used in various clinical studies (<xref ref-type="bibr" rid="ref17">17</xref>). An important advantage of this method is that it does not require the selection of explanatory variables prior to modeling. Furthermore, their non-parametric feature allows them to deal with missing values, and they are robust to the presence of outliers. In the second stage of the method, a decision tree, i.e., the iterative dichotomiser 3 (ID3) algorithm, was used to establish the grouping of DRG. The training set was grouped, and the effect of grouping was evaluated using the test set&#x2019;s data. We conducted 10 random trials using data samples, and the results of these 10 trials were consistent, indicating the stable performance of the algorithm.</p>
<p>All analyses discussed above were performed using RStudio 4.0.2, open-source software provided by Posit (<xref ref-type="bibr" rid="ref18">18</xref>).</p>
</sec>
</sec>
<sec sec-type="results" id="sec11">
<label>3</label>
<title>Results</title>
<p>In the &#x201C;General Information about Inpatient Medical Expenditure&#x201D; section, we summarize the general characteristics of the participants in the study and the results of single factor analysis. In the &#x201C;Grouping Results using CHS-DRG as the benchmark&#x201D; section, the grouping results of CHS-DRGs are presented. The grouping results of the proposed two-stage method are shown in the &#x201C;Grouping results using the two-stage method&#x201D; section. Finally, the performance of the two algorithms is presented in the &#x201C;Comparison of the performance and medical expenditure overuse&#x201D; section.</p>
<sec id="sec12">
<label>3.1</label>
<title>General information about inpatient medical expenditure</title>
<p>From 2016 to 2018, after excluding outliers, a total of USD$ 170.94&#x202F;million in hospitalization expenses were incurred for patients with stroke medical insurance, with average expenses of USD$ 1564.342. Among the patients, 54,115 (49.50%) were male and 55,199 (50.50%) were female. There were 68,498 (62.66%) urban employees and 40,816 (37.34%) urban and rural residents. As the older adults (over 65&#x202F;years of age) accounted for the majority of patients, the older adult population was further divided into three subgroups based on age: 65&#x2013;75, 75&#x2013;85, and over 85&#x202F;years. There were 2,080, 27,673, 35,512, 34,175, and 9,874 patients aged 45&#x202F;years or younger, 45&#x2013;65, 65&#x2013;75, 75&#x2013;85, and over 85&#x202F;years in the target city, accounting for 1.90, 25.32, 32.49, 31.26, and 9.03% of the population included in the study, respectively. Among the patients, 37.97% were hospitalized for less than 9&#x202F;days, 20.97% for 9&#x2013;12&#x202F;days, and 41.06% for more than 12&#x202F;days, as shown in <xref ref-type="table" rid="tab3">Table 3</xref>.</p>
<table-wrap position="float" id="tab3">
<label>Table 3</label>
<caption><p>General information about inpatient medical expenditure of patients with CI.</p></caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Variable definitions</th>
<th align="left" valign="top">Assignment of influencing factors</th>
<th align="center" valign="top">Sample size</th>
<th align="center" valign="top">Proportion (%)</th>
<th align="center" valign="top">Median cost (USD)</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle" rowspan="2">Sex</td>
<td align="left" valign="middle">Male</td>
<td align="char" valign="middle" char=",">54,115</td>
<td align="char" valign="middle" char=".">49.50</td>
<td align="char" valign="middle" char=".">1182.30</td>
</tr>
<tr>
<td align="left" valign="middle">Female</td>
<td align="char" valign="middle" char=",">55,199</td>
<td align="char" valign="middle" char=".">50.50</td>
<td align="char" valign="middle" char=".">1117.56</td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="2">Type of insurance</td>
<td align="left" valign="middle">Urban employee insurance</td>
<td align="char" valign="middle" char=",">68,498</td>
<td align="char" valign="middle" char=".">62.66</td>
<td align="char" valign="middle" char=".">1305.99</td>
</tr>
<tr>
<td align="left" valign="middle">Urban and rural resident insurance</td>
<td align="char" valign="middle" char=",">40,816</td>
<td align="char" valign="middle" char=".">37.34</td>
<td align="char" valign="middle" char=".">880.29</td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="3">Level of hospital</td>
<td align="left" valign="middle">Primary hospital</td>
<td align="char" valign="middle" char=",">21,463</td>
<td align="char" valign="middle" char=".">19.63</td>
<td align="char" valign="middle" char=".">435.80</td>
</tr>
<tr>
<td align="left" valign="middle">Secondary hospital</td>
<td align="char" valign="middle" char=",">35,771</td>
<td align="char" valign="middle" char=".">32.72</td>
<td align="char" valign="middle" char=".">1032.74</td>
</tr>
<tr>
<td align="left" valign="middle">Tertiary hospital</td>
<td align="char" valign="middle" char=",">52,080</td>
<td align="char" valign="middle" char=".">47.64</td>
<td align="char" valign="middle" char=".">1695.10</td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="6">Level of charge</td>
<td align="left" valign="middle">Grade A tertiary hospital</td>
<td align="char" valign="middle" char=",">29,946</td>
<td align="char" valign="middle" char=".">27.39</td>
<td align="char" valign="middle" char=".">2076.27</td>
</tr>
<tr>
<td align="left" valign="middle">Grade B tertiary hospital</td>
<td align="char" valign="middle" char=",">22,130</td>
<td align="char" valign="middle" char=".">20.24</td>
<td align="char" valign="middle" char=".">1269.70</td>
</tr>
<tr>
<td align="left" valign="middle">Grade A secondary hospital</td>
<td align="char" valign="middle" char=",">28,595</td>
<td align="char" valign="middle" char=".">26.16</td>
<td align="char" valign="middle" char=".">1093.57</td>
</tr>
<tr>
<td align="left" valign="middle">Grade B secondary hospital</td>
<td align="char" valign="middle" char=",">5,462</td>
<td align="char" valign="middle" char=".">5.00</td>
<td align="char" valign="middle" char=".">707.55</td>
</tr>
<tr>
<td align="left" valign="middle">Grade B tertiary hospital, up 10%</td>
<td align="char" valign="middle" char=",">3,111</td>
<td align="char" valign="middle" char=".">2.85</td>
<td align="char" valign="middle" char=".">878.86</td>
</tr>
<tr>
<td align="left" valign="middle">Grade B tertiary hospital, down 10%</td>
<td align="char" valign="middle" char=",">20,070</td>
<td align="char" valign="middle" char=".">18.36</td>
<td align="char" valign="middle" char=".">424.35</td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="5">Age</td>
<td align="left" valign="middle">Age&#x202F;&#x2264;&#x202F;45&#x202F;years</td>
<td align="char" valign="middle" char=",">2,080</td>
<td align="char" valign="middle" char=".">1.90</td>
<td align="char" valign="middle" char=".">1318.99</td>
</tr>
<tr>
<td align="left" valign="middle">Age between 45 and 65&#x202F;years</td>
<td align="char" valign="middle" char=",">27,673</td>
<td align="char" valign="middle" char=".">25.32</td>
<td align="char" valign="middle" char=".">1123.59</td>
</tr>
<tr>
<td align="left" valign="middle">Age between 65 and 75&#x202F;years</td>
<td align="char" valign="middle" char=",">35,512</td>
<td align="char" valign="middle" char=".">32.49</td>
<td align="char" valign="middle" char=".">1126.75</td>
</tr>
<tr>
<td align="left" valign="middle">Age between 75 and 85&#x202F;years</td>
<td align="char" valign="middle" char=",">34,175</td>
<td align="char" valign="middle" char=".">31.26</td>
<td align="char" valign="middle" char=".">1165.11</td>
</tr>
<tr>
<td align="left" valign="middle">Age&#x202F;&#x2265;&#x202F;85&#x202F;years</td>
<td align="char" valign="middle" char=",">9,874</td>
<td align="char" valign="middle" char=".">9.03</td>
<td align="char" valign="middle" char=".">1206.43</td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="3">LOS</td>
<td align="left" valign="middle">&#x2264;9&#x202F;days</td>
<td align="char" valign="middle" char=",">41,510</td>
<td align="char" valign="middle" char=".">37.97</td>
<td align="char" valign="middle" char=".">727.14</td>
</tr>
<tr>
<td align="left" valign="middle">9&#x2013;12&#x202F;days</td>
<td align="char" valign="middle" char=",">22,920</td>
<td align="char" valign="middle" char=".">20.97</td>
<td align="char" valign="middle" char=".">1125.06</td>
</tr>
<tr>
<td align="left" valign="middle">&#x2265;12&#x202F;days</td>
<td align="char" valign="middle" char=",">44,884</td>
<td align="char" valign="middle" char=".">41.06</td>
<td align="char" valign="middle" char=".">1777.6</td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="3">CCs</td>
<td align="left" valign="middle">MCC</td>
<td align="char" valign="middle" char=",">18,469</td>
<td align="char" valign="middle" char=".">16.90</td>
<td align="char" valign="middle" char=".">1576.95</td>
</tr>
<tr>
<td align="left" valign="middle">CC</td>
<td align="char" valign="middle" char=",">75,662</td>
<td align="char" valign="middle" char=".">69.22</td>
<td align="char" valign="middle" char=".">1129.17</td>
</tr>
<tr>
<td align="left" valign="middle">Non-CC</td>
<td align="char" valign="middle" char=",">15,183</td>
<td align="char" valign="middle" char=".">13.89</td>
<td align="char" valign="middle" char=".">795.10</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="sec13">
<label>3.2</label>
<title>Grouping results using CHS-DRG as the benchmark</title>
<p>To mitigate the skewness in hospitalization cost distributions, a natural logarithmic transformation was applied to normalize the data. As reported in <xref ref-type="table" rid="tab4">Table 4</xref>, all the subdivided DRGs have a CV below 1, fulfilling the criteria for effective grouping. <xref ref-type="fig" rid="fig2">Figure 2</xref> illustrates four key indicators: enrollment quantity, mean cost (in USD$), standard deviation (SD), and weight. The weights ranged from a minimum of 0.20 (the 16th group) to a maximum of 2.12 (the 9th group), reflecting substantial variation in resource consumption across the disease groups. Group 16, characterized by the lowest resource utilization, had an average cost of USD$ 319.18 and included 3,258 patients, accounting for 2.9% of the total cohort. Conversely, the 9th group, comprising patients with serious CCs in tertiary hospitals, had the highest average cost of USD$ 3,321.86.</p>
<table-wrap position="float" id="tab4">
<label>Table 4</label>
<caption><p>Grouping results and expenses of each group based on CHS-DRG.</p></caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Group number</th>
<th align="center" valign="top">Enrollment quantity</th>
<th align="center" valign="top">Mean</th>
<th align="center" valign="top">SD</th>
<th align="center" valign="top">CV</th>
<th align="center" valign="top">IQR</th>
<th align="center" valign="top">P75</th>
<th align="center" valign="top">Weight</th>
<th align="center" valign="top">Upper limit of expense</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle">1</td>
<td align="char" valign="middle" char=",">8,124</td>
<td align="char" valign="middle" char=",">690.06</td>
<td align="char" valign="middle" char=".">429.50</td>
<td align="char" valign="middle" char=".">0.62</td>
<td align="char" valign="middle" char=".">408.76</td>
<td align="char" valign="middle" char=".">878.74</td>
<td align="char" valign="middle" char=".">0.44</td>
<td align="char" valign="middle" char=".">1,491.88</td>
</tr>
<tr>
<td align="left" valign="middle">2</td>
<td align="char" valign="middle" char=",">16,678</td>
<td align="char" valign="middle" char=",">1,221.77</td>
<td align="char" valign="middle" char=".">696.15</td>
<td align="char" valign="middle" char=".">0.57</td>
<td align="char" valign="middle" char=".">812.78</td>
<td align="char" valign="middle" char=".">1,475.49</td>
<td align="char" valign="middle" char=".">0.78</td>
<td align="char" valign="middle" char=".">2,694.67</td>
</tr>
<tr>
<td align="left" valign="middle">3</td>
<td align="char" valign="middle" char=",">23,599</td>
<td align="char" valign="middle" char=",">2,254.00</td>
<td align="char" valign="middle" char=".">1,765.26</td>
<td align="char" valign="middle" char=".">0.78</td>
<td align="char" valign="middle" char=".">1,226.55</td>
<td align="char" valign="middle" char=".">2,682.47</td>
<td align="char" valign="middle" char=".">1.44</td>
<td align="char" valign="middle" char=".">4,522.30</td>
</tr>
<tr>
<td align="left" valign="middle">4</td>
<td align="char" valign="middle" char=",">6,806</td>
<td align="char" valign="middle" char=",">393.12</td>
<td align="char" valign="middle" char=".">260.54</td>
<td align="char" valign="middle" char=".">0.66</td>
<td align="char" valign="middle" char=".">221.21</td>
<td align="char" valign="middle" char=".">495.97</td>
<td align="char" valign="middle" char=".">0.25</td>
<td align="char" valign="middle" char=".">827.80</td>
</tr>
<tr>
<td align="left" valign="middle">5</td>
<td align="char" valign="middle" char=",">9,034</td>
<td align="char" valign="middle" char=",">1,016.63</td>
<td align="char" valign="middle" char=".">635.00</td>
<td align="char" valign="middle" char=".">0.62</td>
<td align="char" valign="middle" char=".">626.96</td>
<td align="char" valign="middle" char=".">1,244.75</td>
<td align="char" valign="middle" char=".">0.65</td>
<td align="char" valign="middle" char=".">2,185.20</td>
</tr>
<tr>
<td align="left" valign="middle">6</td>
<td align="char" valign="middle" char=",">11,421</td>
<td align="char" valign="middle" char=",">1,722.86</td>
<td align="char" valign="middle" char=".">1,414.44</td>
<td align="char" valign="middle" char=".">0.82</td>
<td align="char" valign="middle" char=".">950.34</td>
<td align="char" valign="middle" char=".">2,051.82</td>
<td align="char" valign="middle" char=".">1.10</td>
<td align="char" valign="middle" char=".">3,477.33</td>
</tr>
<tr>
<td align="left" valign="middle">7</td>
<td align="char" valign="middle" char=",">1,181</td>
<td align="char" valign="middle" char=",">897.35</td>
<td align="char" valign="middle" char=".">702.25</td>
<td align="char" valign="middle" char=".">0.78</td>
<td align="char" valign="middle" char=".">508.78</td>
<td align="char" valign="middle" char=".">1,097.60</td>
<td align="char" valign="middle" char=".">0.57</td>
<td align="char" valign="middle" char=".">1,860.78</td>
</tr>
<tr>
<td align="left" valign="middle">8</td>
<td align="char" valign="middle" char=",">4,171</td>
<td align="char" valign="middle" char=",">1,716.34</td>
<td align="char" valign="middle" char=".">1,556.73</td>
<td align="char" valign="middle" char=".">0.91</td>
<td align="char" valign="middle" char=".">951.45</td>
<td align="char" valign="middle" char=".">1,910.65</td>
<td align="char" valign="middle" char=".">1.10</td>
<td align="char" valign="middle" char=".">3,337.84</td>
</tr>
<tr>
<td align="left" valign="middle">9</td>
<td align="char" valign="middle" char=",">6,947</td>
<td align="char" valign="middle" char=",">3,321.90</td>
<td align="char" valign="middle" char=".">2,987.84</td>
<td align="char" valign="middle" char=".">0.90</td>
<td align="char" valign="middle" char=".">1,509.59</td>
<td align="char" valign="middle" char=".">3,979.61</td>
<td align="char" valign="middle" char=".">2.12</td>
<td align="char" valign="middle" char=".">6,244.00</td>
</tr>
<tr>
<td align="left" valign="middle">10</td>
<td align="char" valign="middle" char=",">595</td>
<td align="char" valign="middle" char=",">509.94</td>
<td align="char" valign="middle" char=".">387.42</td>
<td align="char" valign="middle" char=".">0.76</td>
<td align="char" valign="middle" char=".">265.23</td>
<td align="char" valign="middle" char=".">624.46</td>
<td align="char" valign="middle" char=".">0.33</td>
<td align="char" valign="middle" char=".">1,022.32</td>
</tr>
<tr>
<td align="left" valign="middle">11</td>
<td align="char" valign="middle" char=",">1,974</td>
<td align="char" valign="middle" char=",">1,287.61</td>
<td align="char" valign="middle" char=".">1,159.70</td>
<td align="char" valign="middle" char=".">0.90</td>
<td align="char" valign="middle" char=".">698.37</td>
<td align="char" valign="middle" char=".">1,477.42</td>
<td align="char" valign="middle" char=".">0.82</td>
<td align="char" valign="middle" char=".">2,524.98</td>
</tr>
<tr>
<td align="left" valign="middle">12</td>
<td align="char" valign="middle" char=",">3,601</td>
<td align="char" valign="middle" char=",">2,464.50</td>
<td align="char" valign="middle" char=".">2,390.28</td>
<td align="char" valign="middle" char=".">0.97</td>
<td align="char" valign="middle" char=".">1,150.48</td>
<td align="char" valign="middle" char=".">2,825.83</td>
<td align="char" valign="middle" char=".">1.58</td>
<td align="char" valign="middle" char=".">4,551.56</td>
</tr>
<tr>
<td align="left" valign="middle">13</td>
<td align="char" valign="middle" char=",">1,499</td>
<td align="char" valign="middle" char=",">483.94</td>
<td align="char" valign="middle" char=".">384.73</td>
<td align="char" valign="middle" char=".">0.79</td>
<td align="char" valign="middle" char=".">239.80</td>
<td align="char" valign="middle" char=".">619.81</td>
<td align="char" valign="middle" char=".">0.31</td>
<td align="char" valign="middle" char=".">979.52</td>
</tr>
<tr>
<td align="left" valign="middle">14</td>
<td align="char" valign="middle" char=",">2,113</td>
<td align="char" valign="middle" char=",">999.32</td>
<td align="char" valign="middle" char=".">683.14</td>
<td align="char" valign="middle" char=".">0.68</td>
<td align="char" valign="middle" char=".">601.24</td>
<td align="char" valign="middle" char=".">1,195.92</td>
<td align="char" valign="middle" char=".">0.64</td>
<td align="char" valign="middle" char=".">2,097.78</td>
</tr>
<tr>
<td align="left" valign="middle">15</td>
<td align="char" valign="middle" char=",">4,186</td>
<td align="char" valign="middle" char=",">2,012.63</td>
<td align="char" valign="middle" char=".">1,859.25</td>
<td align="char" valign="middle" char=".">0.92</td>
<td align="char" valign="middle" char=".">1,028.90</td>
<td align="char" valign="middle" char=".">2,340.47</td>
<td align="char" valign="middle" char=".">1.29</td>
<td align="char" valign="middle" char=".">3,883.82</td>
</tr>
<tr>
<td align="left" valign="middle">16</td>
<td align="char" valign="middle" char=",">3,258</td>
<td align="char" valign="middle" char=",">319.17</td>
<td align="char" valign="middle" char=".">223.00</td>
<td align="char" valign="middle" char=".">0.70</td>
<td align="char" valign="middle" char=".">164.41</td>
<td align="char" valign="middle" char=".">423.00</td>
<td align="char" valign="middle" char=".">0.20</td>
<td align="char" valign="middle" char=".">669.62</td>
</tr>
<tr>
<td align="left" valign="middle">17</td>
<td align="char" valign="middle" char=",">1,801</td>
<td align="char" valign="middle" char=",">827.55</td>
<td align="char" valign="middle" char=".">605.01</td>
<td align="char" valign="middle" char=".">0.73</td>
<td align="char" valign="middle" char=".">489.66</td>
<td align="char" valign="middle" char=".">1,025.23</td>
<td align="char" valign="middle" char=".">0.53</td>
<td align="char" valign="middle" char=".">1,759.72</td>
</tr>
<tr>
<td align="left" valign="middle">18</td>
<td align="char" valign="middle" char=",">2,326</td>
<td align="char" valign="middle" char=",">1,498.25</td>
<td align="char" valign="middle" char=".">1,422.46</td>
<td align="char" valign="middle" char=".">0.95</td>
<td align="char" valign="middle" char=".">766.26</td>
<td align="char" valign="middle" char=".">1,782.33</td>
<td align="char" valign="middle" char=".">0.96</td>
<td align="char" valign="middle" char=".">2,931.73</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p>CV, coefficient of variation; IQR, interquartile range; SD, standard deviation.</p>
</table-wrap-foot>
</table-wrap>
<fig position="float" id="fig2">
<label>Figure 2</label>
<caption><p>Grouping results and expenses of each group based on CHS-DRG.</p></caption>
<graphic xlink:href="fpubh-13-1513744-g002.tif"/>
</fig>
</sec>
<sec id="sec14">
<label>3.3</label>
<title>Grouping results using the two-stage method</title>
<p>The grouping results presented in the previous section categorize all patient cases into 18 distinct groups. Notably, six of these groups have a CV above 0.8, suggesting the necessity for refining the CHS-DRG framework. This finding is corroborated by the National Healthcare Security Administration of China, which has identified the deficiency in applying CHS-DRG across the country (<xref ref-type="bibr" rid="ref19">19</xref>). Scholars widely agree that enhancing the management of CCs is crucial for developing a DRG system tailored to local characteristics (<xref ref-type="bibr" rid="ref15">15</xref>).</p>
<p>To improve the CHS-DRG grouping method, a two-stage grouping method is proposed to regroup 109,314 patient cases with CI in the target city, which mainly included the following steps:</p>
<p>First stage: To (1) identify the important CCs affecting hospitalization costs and (2) classify significant CCs into three different levels to replace the three severe levels of CCs in the CHS-DRG.</p>
<p>Second stage: To (1) prioritize the patient cases according to the important CCs after classification and (2) regroup cases using the ID3 decision tree algorithm.</p>
<sec id="sec15">
<label>3.3.1</label>
<title>First stage: classification of CCs</title>
<p>In the first stage, regression analysis is used to determine whether there is a dependence between the cost and CCs, and then, the regression coefficients are used to rank the degree of dependence. The results of the seven regression models are reported in <xref rid="SM1" ref-type="supplementary-material">Supplementary Tables A1&#x2013;A7</xref>, and 641 significant CCs in total were identified and ranked. For example, as <xref rid="SM1" ref-type="supplementary-material">Supplementary Table A1</xref> shows, G97 is one of the CCs in regression model 1. The regression coefficient of G97 is 99,142.41 and the <italic>p</italic>-value is &#x003C;0.05. Therefore, G97 is marked as a significant CC.</p>
<p>As indicated in Section 2, the identified 641 CCs were then classified into three types: MCC, mCC, and non-CC. Part of the classification results of CCs are listed in <xref ref-type="table" rid="tab5">Table 5</xref> and the complete results for the 641 CCs are listed in <xref rid="SM1" ref-type="supplementary-material">Supplementary Table A8</xref>. For example, the regression coefficient of G97 in model 1 ranks in the top 30%, and therefore, G97 is considered an MCC in our new classification of CCs.</p>
<table-wrap position="float" id="tab5">
<label>Table 5</label>
<caption><p>Part of classification results of CCs of the seven regression models.</p></caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Classification</th>
<th align="left" valign="top">ICD code for diseases</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle">MCC code (top 30%)</td>
<td align="left" valign="middle">G97, T06, B37, F43, A40, D46, B95, R23, M88&#x2026;</td>
</tr>
<tr>
<td align="left" valign="middle">mCC code (30&#x2013;60%)</td>
<td align="left" valign="middle">J95, B44, Q12, I12, B49, S73, A41, I85, J12, T82&#x2026;</td>
</tr>
<tr>
<td align="left" valign="middle">non-CC code (60&#x2013;100%)</td>
<td align="left" valign="middle">Z98, L88, G92, C25, D73, R57, D84, J69, J96, E16&#x2026;</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="sec16">
<label>3.3.2</label>
<title>Second stage: grouping results using the algorithm ID3</title>
<p>Employing the identified CCs and other control variables as grouping factors, along with hospitalization expense as the dependent variable, we identified the patients&#x2019; type following the rule shown in <xref ref-type="table" rid="tab2">Table 2</xref>. Then, a two-stage grouping method was developed based on the algorithm ID3. After merging groups containing fewer than 200 patient cases, the method resulted in four distinct groups. As detailed in <xref ref-type="table" rid="tab6">Table 6</xref> and <xref ref-type="fig" rid="fig3">Figure 3</xref>, all groups exhibit a CV below 1, signifying a low intra-group variation and adherence to DRG requirements. In the meantime, there is a notable disparity in resource consumption and medical expenses among the groups. For example, the 1st group, with the smallest weight of 0.52, comprises 28,643 patients with an average medical expense of USD$ 625.10. In contrast, the 4th group, with the highest weight of 2.57, includes 6,411 patients with an average medical expense of USD$ 3,443.37.</p>
<table-wrap position="float" id="tab6">
<label>Table 6</label>
<caption><p>Grouping results of the two-stage method.</p></caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Group number</th>
<th align="center" valign="top">Enrollment quantity</th>
<th align="center" valign="top">Mean</th>
<th align="center" valign="top">SD</th>
<th align="center" valign="top">CV</th>
<th align="center" valign="top">IQR</th>
<th align="center" valign="top">P75</th>
<th align="center" valign="top">Weight</th>
<th align="center" valign="top">Upper limit of expense</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle">1</td>
<td align="char" valign="middle" char=",">28,643</td>
<td align="char" valign="middle" char=",">625.10</td>
<td align="char" valign="middle" char=",">492.09</td>
<td align="char" valign="middle" char=".">0.79</td>
<td align="char" valign="middle" char=",">301.84</td>
<td align="char" valign="top" char=",">820.48</td>
<td align="char" valign="middle" char=".">0.52</td>
<td align="char" valign="top" char=",">1,273.24</td>
</tr>
<tr>
<td align="left" valign="middle">2</td>
<td align="char" valign="middle" char=",">50,725</td>
<td align="char" valign="middle" char=",">1,412.13</td>
<td align="char" valign="middle" char=",">1,118.14</td>
<td align="char" valign="middle" char=".">0.79</td>
<td align="char" valign="middle" char=",">820.11</td>
<td align="char" valign="top" char=",">1,643.08</td>
<td align="char" valign="middle" char=".">1.05</td>
<td align="char" valign="top" char=",">2,873.25</td>
</tr>
<tr>
<td align="left" valign="middle">3</td>
<td align="char" valign="middle" char=",">23,535</td>
<td align="char" valign="middle" char=",">2,521.85</td>
<td align="char" valign="middle" char=",">1,882.56</td>
<td align="char" valign="middle" char=".">0.75</td>
<td align="char" valign="middle" char=",">1,403.93</td>
<td align="char" valign="top" char=",">2,911.92</td>
<td align="char" valign="middle" char=".">1.86</td>
<td align="char" valign="top" char=",">5,017.82</td>
</tr>
<tr>
<td align="left" valign="middle">4</td>
<td align="char" valign="middle" char=",">6,411</td>
<td align="char" valign="middle" char=",">3,443.37</td>
<td align="char" valign="middle" char=",">2,504.83</td>
<td align="char" valign="middle" char=".">0.73</td>
<td align="char" valign="middle" char=",">1,683.88</td>
<td align="char" valign="top" char=",">4,025.18</td>
<td align="char" valign="middle" char=".">2.57</td>
<td align="char" valign="top" char=",">6,551.00</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p>CV, coefficient of variation; IQR, interquartile range; SD, standard deviation.</p>
</table-wrap-foot>
</table-wrap>
<fig position="float" id="fig3">
<label>Figure 3</label>
<caption><p>Grouping results and expenses of each group based on the two-stage method.</p></caption>
<graphic xlink:href="fpubh-13-1513744-g003.tif"/>
</fig>
</sec>
</sec>
<sec id="sec17">
<label>3.4</label>
<title>Comparison of the performance and medical expenditure overuse</title>
<p>DRG grouping aims to ensure that patients with similar resource consumptions/medical expenses are put in the same group, thus reasonably controlling the medical expenses of each group. According to the evaluation guidance in the CTS, the performance of the proposed two-stage method is compared with that of the CHS-DRG, as listed in <xref ref-type="table" rid="tab7">Table 7</xref>.</p>
<list list-type="simple">
<list-item><p>(1) Number of groups: The number of groups obtained by the two-stage method is four, which meets the requirements of DRG, and fewer groups (compared with CHS-DRG) lead to easier implementations.</p></list-item>
<list-item><p>(2) The proportion of groups whose CV is less than 0.8: CV is an important index to evaluate the grouping performance, and a smaller CV indicates smaller intra-group variation and higher intra-group homogeneity. According to CTS, a successful grouping result is obtained in groups with a CV of less than 0.8. As shown in <xref ref-type="table" rid="tab7">Table 7</xref>, only 67% of groups obtained by the CHS-DRG have CVs less than 0.8. However, the CV of all groups resulting from the two-stage method is less than 0.8, which shows a significant improvement.</p></list-item>
<list-item><p>(3) Reduction in variance (RIV): In a decision tree, a larger RIV indicates a better grasp of the inherent law of the data and a higher degree of systematization. RIV of the CHS-DRG is 127.94%, but that of the two-stage method is 131.27%.</p></list-item>
</list>
<table-wrap position="float" id="tab7">
<label>Table 7</label>
<caption><p>Comparison of grouping performance between the CHS-DRG and the two-stage grouping method.</p></caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Evaluation indicators</th>
<th align="center" valign="top">CHS-DRG</th>
<th align="center" valign="top">Two-stage</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle">Number of DRG</td>
<td align="center" valign="middle">18</td>
<td align="center" valign="middle">4</td>
</tr>
<tr>
<td align="left" valign="middle">Overall case enrollment rate</td>
<td align="center" valign="middle">100%</td>
<td align="center" valign="middle">100%</td>
</tr>
<tr>
<td align="left" valign="middle">Standardized case enrollment rate</td>
<td align="center" valign="middle">100%</td>
<td align="center" valign="middle">100%</td>
</tr>
<tr>
<td align="left" valign="middle">Proportion of groups whose CV is less than 1</td>
<td align="center" valign="middle">100%</td>
<td align="center" valign="middle">100%</td>
</tr>
<tr>
<td align="left" valign="middle">Proportion of groups whose CV is less than 0.8</td>
<td align="center" valign="middle">67%</td>
<td align="center" valign="middle">100%</td>
</tr>
<tr>
<td align="left" valign="middle">Reasonable proportion of enrolled cases</td>
<td align="center" valign="middle">100%</td>
<td align="center" valign="middle">100%</td>
</tr>
<tr>
<td align="left" valign="middle">Reduction in variance (RIV)</td>
<td align="center" valign="middle">127.94%</td>
<td align="center" valign="middle">131.27%</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>As the implementation of DRG is aimed at controlling the medical expenses of patients in each group within a certain range (<xref ref-type="bibr" rid="ref20">20</xref>), we demonstrate the superiority of applying the two-stage method by comparing it with the CHS-DRG regarding the overuse of medical resources, as listed in <xref ref-type="table" rid="tab8">Tables 8</xref>, <xref ref-type="table" rid="tab9">9</xref>. The 75th quantile plus 1.5 times interquartile range (P75&#x202F;+&#x202F;1.5IQR) of each group is used to calculate the upper limit of medical expense per patient (<xref ref-type="bibr" rid="ref21">21</xref>), listed in the last column of <xref ref-type="table" rid="tab4">Tables 4</xref>, <xref ref-type="table" rid="tab6">6</xref>, respectively. A patient case whose medical expenses are lower (respectively higher) than the upper limit in each group is considered to be normal (respectively overuse). All the normal (respectively overuse) cases in a group are incorporated into the normal group (respectively overuse group). The overuse rate, i.e., the proportion of patients in the overuse group, is used to measure the two grouping methods.</p>
<table-wrap position="float" id="tab8">
<label>Table 8</label>
<caption><p>Statistics on medical resources according to the CHS-DRG.</p></caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top" rowspan="2">Group number</th>
<th align="center" valign="top" colspan="4">Number of patients</th>
<th align="center" valign="top" colspan="3">Mean (USD$)</th>
<th align="center" valign="top" colspan="2">Median of LOS</th>
<th align="center" valign="top" colspan="2">Average number of CCs</th>
</tr>
<tr>
<th align="center" valign="top">Total</th>
<th align="center" valign="top">Normal group</th>
<th align="center" valign="top">Overuse group</th>
<th align="center" valign="top">Overuse rate (%)</th>
<th align="center" valign="top">Normal group</th>
<th align="center" valign="top">Overuse group</th>
<th align="center" valign="top">Times</th>
<th align="center" valign="top">Normal group</th>
<th align="center" valign="top">Overuse group</th>
<th align="center" valign="top">Normal group</th>
<th align="center" valign="top">Overuse group</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle">1</td>
<td align="char" valign="middle" char=",">8,124</td>
<td align="char" valign="middle" char=",">7,908</td>
<td align="center" valign="middle">216</td>
<td align="char" valign="top" char=".">2.66</td>
<td align="char" valign="middle" char=",">402.93</td>
<td align="char" valign="middle" char=",">1,687.42</td>
<td align="char" valign="top" char=".">4.19</td>
<td align="center" valign="middle">10</td>
<td align="center" valign="middle">20</td>
<td align="center" valign="middle">5</td>
<td align="center" valign="middle">6</td>
</tr>
<tr>
<td align="left" valign="middle">2</td>
<td align="char" valign="middle" char=",">16,678</td>
<td align="char" valign="middle" char=",">16,192</td>
<td align="center" valign="middle">486</td>
<td align="char" valign="top" char=".">2.91</td>
<td align="char" valign="middle" char=",">1,082.84</td>
<td align="char" valign="middle" char=",">3,246.01</td>
<td align="char" valign="top" char=".">3</td>
<td align="center" valign="middle">12</td>
<td align="center" valign="middle">25</td>
<td align="center" valign="middle">5</td>
<td align="center" valign="middle">6</td>
</tr>
<tr>
<td align="left" valign="middle">3</td>
<td align="char" valign="middle" char=",">23,599</td>
<td align="char" valign="middle" char=",">21,883</td>
<td align="center" valign="middle">1,716</td>
<td align="char" valign="top" char=".">7.27</td>
<td align="char" valign="middle" char=",">1,700.59</td>
<td align="char" valign="middle" char=",">5,942.31</td>
<td align="char" valign="top" char=".">3.49</td>
<td align="center" valign="middle">12</td>
<td align="center" valign="middle">28</td>
<td align="center" valign="middle">5</td>
<td align="center" valign="middle">5</td>
</tr>
<tr>
<td align="left" valign="middle">4</td>
<td align="char" valign="middle" char=",">6,806</td>
<td align="char" valign="middle" char=",">6,424</td>
<td align="center" valign="middle">382</td>
<td align="char" valign="top" char=".">5.61</td>
<td align="char" valign="middle" char=",">322.34</td>
<td align="char" valign="middle" char=",">999.85</td>
<td align="char" valign="top" char=".">3.1</td>
<td align="center" valign="middle">8</td>
<td align="center" valign="middle">16</td>
<td align="center" valign="middle">3</td>
<td align="center" valign="middle">4</td>
</tr>
<tr>
<td align="left" valign="middle">5</td>
<td align="char" valign="middle" char=",">9,034</td>
<td align="char" valign="middle" char=",">8,649</td>
<td align="center" valign="middle">385</td>
<td align="char" valign="top" char=".">4.26</td>
<td align="char" valign="middle" char=",">859.32</td>
<td align="char" valign="middle" char=",">2,627.81</td>
<td align="char" valign="top" char=".">3.06</td>
<td align="center" valign="middle">10</td>
<td align="center" valign="middle">24</td>
<td align="center" valign="middle">4</td>
<td align="center" valign="middle">6</td>
</tr>
<tr>
<td align="left" valign="middle">6</td>
<td align="char" valign="middle" char=",">11,421</td>
<td align="char" valign="middle" char=",">10,670</td>
<td align="center" valign="middle">751</td>
<td align="char" valign="top" char=".">6.58</td>
<td align="char" valign="middle" char=",">1,318.31</td>
<td align="char" valign="middle" char=",">4,725.59</td>
<td align="char" valign="top" char=".">3.58</td>
<td align="center" valign="middle">10</td>
<td align="center" valign="middle">21</td>
<td align="center" valign="middle">4</td>
<td align="center" valign="middle">5</td>
</tr>
<tr>
<td align="left" valign="middle">7</td>
<td align="char" valign="middle" char=",">1,181</td>
<td align="char" valign="middle" char=",">1,108</td>
<td align="center" valign="middle">73</td>
<td align="char" valign="top" char=".">6.18</td>
<td align="char" valign="middle" char=",">735.50</td>
<td align="char" valign="middle" char=",">2,235.95</td>
<td align="char" valign="top" char=".">3.04</td>
<td align="center" valign="middle">12</td>
<td align="center" valign="middle">27</td>
<td align="center" valign="middle">6</td>
<td align="center" valign="middle">7</td>
</tr>
<tr>
<td align="left" valign="middle">8</td>
<td align="char" valign="middle" char=",">4,171</td>
<td align="char" valign="middle" char=",">3,852</td>
<td align="center" valign="middle">319</td>
<td align="char" valign="top" char=".">7.65</td>
<td align="char" valign="middle" char=",">1,272.48</td>
<td align="char" valign="middle" char=",">4,921.30</td>
<td align="char" valign="top" char=".">3.87</td>
<td align="center" valign="middle">14</td>
<td align="center" valign="middle">28</td>
<td align="center" valign="middle">6</td>
<td align="center" valign="middle">7</td>
</tr>
<tr>
<td align="left" valign="middle">9</td>
<td align="char" valign="middle" char=",">6,947</td>
<td align="char" valign="middle" char=",">6,173</td>
<td align="center" valign="middle">774</td>
<td align="char" valign="top" char=".">11.14</td>
<td align="char" valign="middle" char=",">2,153.25</td>
<td align="char" valign="middle" char=",">8,872.48</td>
<td align="char" valign="top" char=".">4.12</td>
<td align="center" valign="middle">13</td>
<td align="center" valign="middle">30</td>
<td align="center" valign="middle">6</td>
<td align="center" valign="middle">7</td>
</tr>
<tr>
<td align="left" valign="middle">10</td>
<td align="char" valign="middle" char=",">595</td>
<td align="char" valign="middle" char=",">551</td>
<td align="center" valign="middle">44</td>
<td align="char" valign="top" char=".">7.39</td>
<td align="char" valign="middle" char=",">397.63</td>
<td align="char" valign="middle" char=",">1,562.86</td>
<td align="char" valign="top" char=".">3.93</td>
<td align="center" valign="middle">9</td>
<td align="center" valign="middle">23</td>
<td align="center" valign="middle">4</td>
<td align="center" valign="middle">7</td>
</tr>
<tr>
<td align="left" valign="middle">11</td>
<td align="char" valign="middle" char=",">1,974</td>
<td align="char" valign="middle" char=",">1,836</td>
<td align="center" valign="middle">138</td>
<td align="char" valign="top" char=".">6.99</td>
<td align="char" valign="middle" char=",">969.08</td>
<td align="char" valign="middle" char=",">3,374.85</td>
<td align="char" valign="top" char=".">3.48</td>
<td align="center" valign="middle">9</td>
<td align="center" valign="middle">22</td>
<td align="center" valign="middle">6</td>
<td align="center" valign="middle">7</td>
</tr>
<tr>
<td align="left" valign="middle">12</td>
<td align="char" valign="middle" char=",">3,601</td>
<td align="char" valign="middle" char=",">3,206</td>
<td align="center" valign="middle">395</td>
<td align="char" valign="top" char=".">10.97</td>
<td align="char" valign="middle" char=",">1,627.37</td>
<td align="char" valign="middle" char=",">6,475.59</td>
<td align="char" valign="top" char=".">3.98</td>
<td align="center" valign="middle">10</td>
<td align="center" valign="middle">23</td>
<td align="center" valign="middle">6</td>
<td align="center" valign="middle">7</td>
</tr>
<tr>
<td align="left" valign="middle">13</td>
<td align="char" valign="middle" char=",">1,499</td>
<td align="char" valign="middle" char=",">1,391</td>
<td align="center" valign="middle">108</td>
<td align="char" valign="top" char=".">7.2</td>
<td align="char" valign="middle" char=",">374.26</td>
<td align="char" valign="middle" char=",">1,186.68</td>
<td align="char" valign="top" char=".">3.17</td>
<td align="center" valign="middle">10</td>
<td align="center" valign="middle">19</td>
<td align="center" valign="middle">1</td>
<td align="center" valign="middle">2</td>
</tr>
<tr>
<td align="left" valign="middle">14</td>
<td align="char" valign="middle" char=",">2,113</td>
<td align="char" valign="middle" char=",">2,006</td>
<td align="center" valign="middle">107</td>
<td align="char" valign="top" char=".">5.06</td>
<td align="char" valign="middle" char=",">839.79</td>
<td align="char" valign="middle" char=",">2,660.06</td>
<td align="char" valign="top" char=".">3.17</td>
<td align="center" valign="middle">10</td>
<td align="center" valign="middle">19</td>
<td align="center" valign="middle">2</td>
<td align="center" valign="middle">0</td>
</tr>
<tr>
<td align="left" valign="middle">15</td>
<td align="char" valign="middle" char=",">4,186</td>
<td align="char" valign="middle" char=",">3,869</td>
<td align="center" valign="middle">317</td>
<td align="char" valign="top" char=".">7.57</td>
<td align="char" valign="middle" char=",">1,493.79</td>
<td align="char" valign="middle" char=",">5,459.46</td>
<td align="char" valign="top" char=".">3.65</td>
<td align="center" valign="middle">10</td>
<td align="center" valign="middle">19</td>
<td align="center" valign="middle">1</td>
<td align="center" valign="middle">0</td>
</tr>
<tr>
<td align="left" valign="middle">16</td>
<td align="char" valign="middle" char=",">3,258</td>
<td align="char" valign="middle" char=",">3,050</td>
<td align="center" valign="middle">208</td>
<td align="char" valign="top" char=".">6.38</td>
<td align="char" valign="middle" char=",">254.29</td>
<td align="char" valign="middle" char=",">784.02</td>
<td align="char" valign="top" char=".">3.08</td>
<td align="center" valign="middle">8</td>
<td align="center" valign="middle">19</td>
<td align="center" valign="middle">0</td>
<td align="center" valign="middle">0</td>
</tr>
<tr>
<td align="left" valign="middle">17</td>
<td align="char" valign="middle" char=",">1,801</td>
<td align="char" valign="middle" char=",">1,719</td>
<td align="center" valign="middle">82</td>
<td align="char" valign="top" char=".">4.55</td>
<td align="char" valign="middle" char=",">687.13</td>
<td align="char" valign="middle" char=",">2,210.65</td>
<td align="char" valign="top" char=".">3.22</td>
<td align="center" valign="middle">8</td>
<td align="center" valign="middle">17</td>
<td align="center" valign="middle">0</td>
<td align="center" valign="middle">1</td>
</tr>
<tr>
<td align="left" valign="middle">18</td>
<td align="char" valign="middle" char=",">2,326</td>
<td align="char" valign="middle" char=",">2,166</td>
<td align="center" valign="middle">160</td>
<td align="char" valign="top" char=".">6.88</td>
<td align="char" valign="middle" char=",">1,122.33</td>
<td align="char" valign="middle" char=",">3,637.13</td>
<td align="char" valign="top" char=".">3.24</td>
<td align="center" valign="middle">8</td>
<td align="center" valign="middle">15</td>
<td align="center" valign="middle">1</td>
<td align="center" valign="middle">0</td>
</tr>
</tbody>
</table>
</table-wrap>
<table-wrap position="float" id="tab9">
<label>Table 9</label>
<caption><p>Statistics on medical resources according to the two-stage grouping method.</p></caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top" rowspan="2">Group number</th>
<th align="center" valign="top" colspan="4">Number of patients</th>
<th align="center" valign="top" colspan="3">Mean (USD$)</th>
<th align="center" valign="top" colspan="2">Median of LOS</th>
<th align="center" valign="top" colspan="2">Average number of CCs</th>
</tr>
<tr>
<th align="center" valign="top">Total</th>
<th align="center" valign="top">Normal group</th>
<th align="center" valign="top">Overuse group</th>
<th align="center" valign="top">Overuse rate (%)</th>
<th align="center" valign="top">Normal group</th>
<th align="center" valign="top">Overuse group</th>
<th align="center" valign="top">Times</th>
<th align="center" valign="top">Normal group</th>
<th align="center" valign="top">Overuse group</th>
<th align="center" valign="top">Normal group</th>
<th align="center" valign="top">Overuse group</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle">1</td>
<td align="char" valign="middle" char=",">28,643</td>
<td align="char" valign="middle" char=",">26,456</td>
<td align="char" valign="middle" char=",">2,187</td>
<td align="char" valign="top" char=".">7.64</td>
<td align="char" valign="middle" char=",">482.91</td>
<td align="char" valign="middle" char=",">1,573.29</td>
<td align="char" valign="top" char=".">3.26</td>
<td align="center" valign="middle">10</td>
<td align="center" valign="middle">19</td>
<td align="center" valign="middle">3</td>
<td align="center" valign="middle">6</td>
</tr>
<tr>
<td align="left" valign="middle">2</td>
<td align="char" valign="middle" char=",">50,725</td>
<td align="char" valign="middle" char=",">47,632</td>
<td align="char" valign="middle" char=",">3,093</td>
<td align="char" valign="top" char=".">6.1</td>
<td align="char" valign="middle" char=",">1,129.17</td>
<td align="char" valign="middle" char=",">3,777.58</td>
<td align="char" valign="top" char=".">3.35</td>
<td align="center" valign="middle">10</td>
<td align="center" valign="middle">24</td>
<td align="center" valign="middle">5</td>
<td align="center" valign="middle">6</td>
</tr>
<tr>
<td align="left" valign="middle">3</td>
<td align="char" valign="middle" char=",">23,535</td>
<td align="char" valign="middle" char=",">21,749</td>
<td align="char" valign="middle" char=",">1,786</td>
<td align="char" valign="top" char=".">7.59</td>
<td align="char" valign="middle" char=",">1,907.56</td>
<td align="char" valign="middle" char=",">6,823.83</td>
<td align="char" valign="top" char=".">3.58</td>
<td align="center" valign="middle">12</td>
<td align="center" valign="middle">27</td>
<td align="center" valign="middle">5</td>
<td align="center" valign="middle">6</td>
</tr>
<tr>
<td align="left" valign="middle">4</td>
<td align="char" valign="middle" char=",">6,411</td>
<td align="char" valign="middle" char=",">5,729</td>
<td align="char" valign="middle" char=",">682</td>
<td align="char" valign="top" char=".">10.64</td>
<td align="char" valign="middle" char=",">2,354.15</td>
<td align="char" valign="middle" char=",">9,349.16</td>
<td align="char" valign="top" char=".">3.97</td>
<td align="center" valign="middle">13</td>
<td align="center" valign="middle">28</td>
<td align="center" valign="middle">5</td>
<td align="center" valign="middle">7</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>For the CHS-DRG, the highest overuse rate is observed in the 9th group, reaching 11.14%, and the overuse rate of the 12th group also exceeds 10%, indicating an unbalanced grouping outcome. For the two-stage method, the overuse rates of the first three groups are all less than 8%. Though the overuse rate of the 4th group exceeds 10%, this group only includes a small proportion of patients compared to those in the first three groups. For the average medical expense, a significant difference is observed between each overuse group and the corresponding normal group by the CHS-DRG. For example, the average cost of the overuse group for the 1st and 9th groups is more than four times that of the normal group by the CHS-DRG, while the average cost of the overuse group for the 5th and 7th groups is approximately three times that of the normal group. By contrast, the difference between each overuse group and the corresponding normal group is relatively small by the two-stage method, with the ratio ranging between 3.26 and 3.97. LOS is also an important indicator to show the performance of a grouping method, as a longer time for a patient staying in the hospital usually leads to more resource consumption. LOS can also indicate the use of resources that cannot be directly reflected by money. These two methods show similar performance on LOS.</p>
</sec>
</sec>
<sec sec-type="discussion" id="sec18">
<label>4</label>
<title>Discussion</title>
<p>The increase in medical expenses in China has outpaced the average growth rate of the national GDP. In the target city, focusing on cerebral infarction (CI), the patient population increased sharply from 22,672 to 55,081 between 2011 and 2018. Concurrently, the average expenditure per patient escalated from USD$ 928 in 2011 to USD$ 1,081 in 2018. This significant increase in medical expenses has imposed a substantial financial burden on the healthcare insurance system. Controlling medical costs has emerged as a critical priority for policymakers. The DRG system, recognized as a sophisticated approach to medical payment management, aims to mitigate inefficiencies and reduce expenditures. This method was initially implemented in Beijing, the capital of China, in 2018. The Chinese government then developed the CHS-DRG and introduced it to 30 other cities. However, unbalanced economic development and regional variations in the disease spectrum pose significant challenges to the applicability of this method, since the DRG system is primarily developed using data from the developed regions.</p>
<p>The city selected for our study is located in an economically underdeveloped region in western China. In this city, the medical expenses of CI have witnessed a sharp increase, prompting its selection as the focal point of our research. Using local healthcare data, we categorized patients into groups based on hospitalization costs and clinical profiles. To this end, a novel two-stage method devised specifically for this investigation was developed and compared to the existing CHS-DRG method, which enjoys widespread adoption in China. Our findings indicate that tailoring the classification of CCs according to local characteristics prior to grouping significantly enhances the adaptability of the DRG system. Specifically, in the target city, implementing the two-stage method for DRG could result in savings of approximately USD$ 8.71&#x202F;million. If implemented nationally, this method can potentially alleviate the financial burden on China&#x2019;s healthcare system.</p>
<p>CHS-DRG, recognized as China&#x2019;s most authoritative DRG grouping system (<xref ref-type="bibr" rid="ref4">4</xref>), has been developed by applying the Australian case-mix classification method with data from developed regions in China (<xref ref-type="bibr" rid="ref22">22</xref>). The severity of CCs is determined by their incidence rates. CCs with high incidence rate are considered severe, while those with low incidence are considered general. Our research in a western Chinese city revealed that the CHS-DRG system, while comprehensive, resulted in complex and numerous groups of cases. The incidence rate of CCs in the city is significantly different from the classification in the CHS-DRG, which may be due to the significant regional variance in the disease spectrum since the vast expanse of China leads to the diversity in regional dietary habits and economic disparities. Consequently, the CHS-DRG system may not uniformly apply across the country. It is imperative that each region tailors its DRG grouping strategy to reflect local epidemiological patterns and healthcare needs.</p>
<p>Empirical evidence consistently demonstrates that CCs are significant determinants of healthcare expenditures (<xref ref-type="bibr" rid="ref23">23</xref>). The findings of this study highlight that the incidence rates of CCs exhibit substantial regional disparities. Consequently, applying a uniform set of criteria across the entire country would be imprudent. The fundamental aim of DRG implementation is to optimize cost management in the healthcare system. Therefore, when developing DRG grouping criteria, it is imperative to prioritize the impact of CCs on medical expenditures over their incidence rates. Utilizing data from the local region, we constructed seven regression models in the first stage to classify CCs and, subsequently, in the second stage, grouped the patient cases based on algorithm ID3. This two-stage method significantly enhanced the performance of CCs classification.</p>
<p>The grouping result of the two-stage method is reported in <xref ref-type="table" rid="tab6">Table 6</xref> and that of the CHS-DRG is presented in <xref ref-type="table" rid="tab4">Table 4</xref>. The CHS-DRG obtains 18 groups, but only 4 groups resulted from the two-stage method, which indicates that the two-stage method is notably straightforward, making it easily implementable across a wide range of regions, thereby underscoring its robust practical applicability. These results also suggest that different classifications of CCs can lead to different grouping plans. According to <xref ref-type="table" rid="tab7">Table 7</xref>, the two-stage method significantly improved on the CHS-DRG in terms of the proportion of groups with CV less than 80%, from 67% to 100%. The smaller intra-group difference of the two-stage method indicates it to be a more reasonable grouping plan for the DRG in the target city.</p>
<p>We used the P75&#x202F;+&#x202F;1.5IQR as the upper limit of each group, listed in <xref ref-type="table" rid="tab4">Tables 4</xref>, <xref ref-type="table" rid="tab6">6</xref>, to identify outliers within each group, categorizing these outliers as instances of medical overuse. Based on the two proposed models, the medical resource utilizations of the normal and overuse groups are shown in <xref ref-type="table" rid="tab8">Tables 8</xref>, <xref ref-type="table" rid="tab9">9</xref>, respectively. The medical resources under consideration encompassed several key metrics: the number of patients, average medical expense, and the LOS. Notably, the LOS for the overuse group is significantly longer than that for the normal group, indicating a potential avenue for cost reduction through LOS management.</p>
<p><xref ref-type="table" rid="tab8">Tables 8</xref>, <xref ref-type="table" rid="tab9">9</xref> also present the average number of CCs in each group for the two methods. This reveals a substantial disparity between the normal and overuse groups within the same DRG group, underscoring the variability in medical resource allocation. In the context of the two-stage method, more CCs are observed in overuse groups than in the corresponding normal group, which aligns with the medical expenses of each group, verifying the importance of considering CCs in assessing medical resource utilization (<xref ref-type="bibr" rid="ref24">24</xref>). An anomaly is observed in the CHS-DRG grouping results, specifically within the 14th, 15th, and 18th groups. Contrary to expectations, the overuse group exhibited fewer CCs than the corresponding normal group, as detailed in <xref ref-type="table" rid="tab8">Table 8</xref>, which may be because the CHS-DRG classifies CCs based on the incidence rate and thus some CCs having low incidence rates but high costs are ignored. However, medical expenses, not the incidence rate, matter when developing DRG. For example, hypertension is a common CC of CI, but the cost of treating hypertension is very low, which also indicates the need for improvement in the CHS-DRG.</p>
<p>Furthermore, the average medical expense and number of patients for each overuse group reported in <xref ref-type="table" rid="tab8">Tables 8</xref>, <xref ref-type="table" rid="tab9">9</xref> and the upper limit expenditure for each group in <xref ref-type="table" rid="tab4">Tables 4</xref>, <xref ref-type="table" rid="tab6">6</xref> can contribute to the following insights: Should a stringent full control policy be enforced to curb medical expenditures, it is projected that the implementation of the CHS-DRG would result in an estimated savings of USD$ 8.14&#x202F;million for the target city. Furthermore, the application of our proposed two-stage method could yield even larger savings, with a projected reduction of USD$ 8.59&#x202F;million in medical expenses. This outcome is desirable to the government and the medical insurance department.</p>
</sec>
<sec sec-type="conclusions" id="sec19">
<label>5</label>
<title>Conclusion</title>
<p>Although the CHS-DRG system is recognized as China&#x2019;s most authoritative medical payment system, our study indicates that regional customization is essential. CCs should be tailored according to data from local regions rather than adhering to a one-size-fits-all DRG system nationwide. In this research, we used real data from a developing city to identify suitable methods for DRG grouping, thus filling a gap in the extant literature, which only considers developed regions. We developed a two-stage grouping method through the classification of CCs. The effectiveness of the method was demonstrated using real data, and its performance was analyzed via comparison with the CHS-DRG.</p>
<p>The scope of this study is limited by the use of data from a single city. To enhance the generalizability of our findings, it is recommended that data from a minimum of three cities be included in future research. Additionally, the absence of a standardized surgical coding system across hospitals has restricted our ability to incorporate surgical codes into the analysis. This finding highlights the necessity for further research that addresses these methodological constraints and expands the scope of our understanding.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="sec20">
<title>Data availability statement</title>
<p>The datasets presented in this article are not readily available because the data were taken from the Medical Insurance Laboratory of the Healthcare Security Administration of Chengdu and there are administrative restrictions. Requests to access the datasets should be directed to the corresponding author.</p>
</sec>
<sec sec-type="author-contributions" id="sec21">
<title>Author contributions</title>
<p>SZ: Conceptualization, Data curation, Investigation, Methodology, Supervision, Writing &#x2013; original draft. XH: Conceptualization, Data curation, Investigation, Methodology, Project administration, Supervision, Writing &#x2013; original draft. JL: Conceptualization, Data curation, Formal analysis, Project administration, Supervision, Writing &#x2013; original draft. LL: Conceptualization, Data curation, Formal analysis, Funding acquisition, Investigation, Software, Writing &#x2013; original draft.</p>
</sec>
<sec sec-type="funding-information" id="sec22">
<title>Funding</title>
<p>The author(s) declare that financial support was received for the research and/or publication of this article. This project was sponsored by The National Science Foundation of China (grant no. 72001153), Operational Matching Funds of Sichuan University, Chengdu University of Information Technology talent introduction project (grant no. KYTZ2022123), Henan Zhongyuan Medical Science and Technology Innovation and Development Foundation (grant nos. 24YCG1001 and 24YCG2002), and Science and Technology Plan Soft Science Project of Sichuan Province (grant no. 2023JDR0157).</p>
</sec>
<ack>
<p>The authors appreciate the staff in Healthcare Security Administration of the target city (HSAC) for their useful suggestions on data collection.</p>
</ack>
<sec sec-type="COI-statement" id="sec23">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="ai-statement" id="sec24">
<title>Generative AI statement</title>
<p>The authors declare that no Gen AI was used in the creation of this manuscript.</p>
</sec>
<sec sec-type="disclaimer" id="sec25">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec sec-type="supplementary-material" id="sec26">
<title>Supplementary material</title>
<p>The Supplementary material for this article can be found online at: <ext-link xlink:href="https://www.frontiersin.org/articles/10.3389/fpubh.2025.1513744/full#supplementary-material" ext-link-type="uri">https://www.frontiersin.org/articles/10.3389/fpubh.2025.1513744/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Table_1.DOCX" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="ref1"><label>1.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lin</surname> <given-names>B</given-names></name> <name><surname>Zhang</surname> <given-names>Z</given-names></name> <name><surname>Guo</surname> <given-names>Y</given-names></name> <name><surname>Wang</surname> <given-names>W</given-names></name> <name><surname>Mei</surname> <given-names>Y</given-names></name> <name><surname>Wang</surname> <given-names>S</given-names></name> <etal/></person-group>. <article-title>Perceptions of recurrence risk and behavioural changes among first-ever and recurrent stroke survivors: a qualitative analysis</article-title>. <source>Health Expect</source>. (<year>2021</year>) <volume>24</volume>:<fpage>1962</fpage>&#x2013;<lpage>70</lpage>. doi: <pub-id pub-id-type="doi">10.1111/hex.13335</pub-id>, PMID: <pub-id pub-id-type="pmid">34363288</pub-id></citation></ref>
<ref id="ref2"><label>2.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zeng</surname> <given-names>S</given-names></name> <name><surname>Luo</surname> <given-names>L</given-names></name> <name><surname>Fang</surname> <given-names>Y</given-names></name> <name><surname>He</surname> <given-names>X</given-names></name></person-group>. <article-title>Cost control of treatment for cerebrovascular patients using a machine learning model in western China</article-title>. <source>J Healthc Eng</source>. (<year>2021</year>) <volume>2021</volume>:<fpage>6158961</fpage>. doi: <pub-id pub-id-type="doi">10.1155/2021/6158961</pub-id>, PMID: <pub-id pub-id-type="pmid">34853670</pub-id></citation></ref>
<ref id="ref3"><label>3.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zeng</surname> <given-names>S</given-names></name> <name><surname>Zhang</surname> <given-names>Y</given-names></name> <name><surname>Guo</surname> <given-names>C</given-names></name> <name><surname>Zhou</surname> <given-names>X</given-names></name> <name><surname>He</surname> <given-names>X</given-names></name></person-group>. <article-title>Big data-enabled analysis of factors affecting medical expenditure in the cerebral infarction of a developing City in Western China</article-title>. <source>Risk Manag Healthc Policy</source>. (<year>2023</year>) <volume>16</volume>:<fpage>2703</fpage>&#x2013;<lpage>14</lpage>. doi: <pub-id pub-id-type="doi">10.2147/RMHP.S438869</pub-id>, PMID: <pub-id pub-id-type="pmid">38107438</pub-id></citation></ref>
<ref id="ref4"><label>4.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hadning</surname> <given-names>I</given-names></name> <name><surname>Ikawati</surname> <given-names>Z</given-names></name> <name><surname>Andayani</surname> <given-names>TM</given-names></name></person-group>. <article-title>Stroke treatment cost analysis for consideration on health cost determination using INA-CBGs at Jogja Hospital</article-title>. <source>Int J Public Health Sci</source>. (<year>2015</year>) <volume>4</volume>:<fpage>288</fpage>&#x2013;<lpage>93</lpage>. doi: <pub-id pub-id-type="doi">10.11591/ijphs.v4i4.4748</pub-id></citation></ref>
<ref id="ref5"><label>5.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wu</surname> <given-names>SW</given-names></name> <name><surname>Pan</surname> <given-names>Q</given-names></name> <name><surname>Chen</surname> <given-names>T</given-names></name></person-group>. <article-title>Research on diagnosis-related group grouping of inpatient medical expenditure in colorectal cancer patients based on a decision tree model</article-title>. <source>World J Clin Cases</source>. (<year>2020</year>) <volume>8</volume>:<fpage>2484</fpage>&#x2013;<lpage>93</lpage>. doi: <pub-id pub-id-type="doi">10.12998/wjcc.v8.i12.2484</pub-id>, PMID: <pub-id pub-id-type="pmid">32607325</pub-id></citation></ref>
<ref id="ref6"><label>6.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yu</surname> <given-names>L</given-names></name> <name><surname>Lang</surname> <given-names>J</given-names></name></person-group>. <article-title>Diagnosis-related groups (DRG) pricing and payment policy in China: where are we?</article-title> <source>Hepatobiliary Surg Nutr</source>. (<year>2020</year>) <volume>9</volume>:<fpage>771</fpage>&#x2013;<lpage>3</lpage>. doi: <pub-id pub-id-type="doi">10.21037/hbsn-2020-8</pub-id>, PMID: <pub-id pub-id-type="pmid">33299831</pub-id></citation></ref>
<ref id="ref7"><label>7.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Panagiotopoulos</surname> <given-names>P</given-names></name> <name><surname>Maniadakis</surname> <given-names>N</given-names></name> <name><surname>Papatheodoridis</surname> <given-names>G</given-names></name> <name><surname>Pektasidis</surname> <given-names>D</given-names></name></person-group>. <article-title>An evaluation of diagnosis-related group (DRG) implementation focused on cancer DRGs in Greek public hospitals</article-title>. <source>Pharmacoecon Open</source>. (<year>2020</year>) <volume>4</volume>:<fpage>61</fpage>&#x2013;<lpage>9</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s41669-019-0146-z</pub-id>, PMID: <pub-id pub-id-type="pmid">31111448</pub-id></citation></ref>
<ref id="ref8"><label>8.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Meng</surname> <given-names>Z</given-names></name> <name><surname>Hui</surname> <given-names>W</given-names></name> <name><surname>Cai</surname> <given-names>Y</given-names></name> <name><surname>Liu</surname> <given-names>J</given-names></name> <name><surname>Wu</surname> <given-names>H</given-names></name></person-group>. <article-title>The effects of DRGs-based payment compared with cost-based payment on inpatient healthcare utilization: a systematic review and meta-analysis</article-title>. <source>Health Policy</source>. (<year>2020</year>) <volume>124</volume>:<fpage>359</fpage>&#x2013;<lpage>67</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.healthpol.2020.01.007</pub-id>, PMID: <pub-id pub-id-type="pmid">32001043</pub-id></citation></ref>
<ref id="ref9"><label>9.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Camilleri</surname> <given-names>C</given-names></name> <name><surname>Jofre-Bonet</surname> <given-names>M</given-names></name> <name><surname>Serra-Sastre</surname> <given-names>V</given-names></name></person-group>. <article-title>The suitability of a DRG casemix system in the Maltese hospital setting</article-title>. <source>Health Policy</source>. (<year>2018</year>) <volume>122</volume>:<fpage>1183</fpage>&#x2013;<lpage>9</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.healthpol.2018.08.002</pub-id></citation></ref>
<ref id="ref10"><label>10.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zou</surname> <given-names>K</given-names></name> <name><surname>Li</surname> <given-names>HY</given-names></name> <name><surname>Zhou</surname> <given-names>D</given-names></name> <name><surname>Liao</surname> <given-names>ZJ</given-names></name></person-group>. <article-title>The effects of diagnosis-related groups payment on hospital healthcare in China: a systematic review</article-title>. <source>BMC Health Serv Res</source>. (<year>2020</year>) <volume>20</volume>:<fpage>1</fpage>&#x2013;<lpage>11</lpage>. doi: <pub-id pub-id-type="doi">10.1186/s12913-020-4957-5</pub-id>, PMID: <pub-id pub-id-type="pmid">32050962</pub-id></citation></ref>
<ref id="ref11"><label>11.</label><citation citation-type="web"><person-group person-group-type="author"><collab id="coll1">National Healthcare Security Administration</collab></person-group>. <italic>Grouping and payment technical specifications for the China Healthcare Security Diagnosis Related Groups (CHS-DRG)</italic>. (<year>2019</year>). Available online at: <ext-link xlink:href="https://www.nhsa.gov.cn/art/2019/10/24/art_37_1878.html" ext-link-type="uri">https://www.nhsa.gov.cn/art/2019/10/24/art_37_1878.html</ext-link> (Accessed July 21, 2024).</citation></ref>
<ref id="ref12"><label>12.</label><citation citation-type="web"><person-group person-group-type="author"><collab id="coll2">National Healthcare Security Administration</collab></person-group>. <italic>Grouping plan for the China Healthcare Security Diagnosis Related Groups (CHS-DRG)</italic>. (<year>2019</year>). Available online at: <ext-link xlink:href="https://www.nhsa.gov.cn/module/download/downfile.jsp?classid=0&#x0026;filename=289d4e344c30423b95e33e81ddd086e7.pdf" ext-link-type="uri">https://www.nhsa.gov.cn/module/download/downfile.jsp?classid=0&#x0026;filename=289d4e344c30423b95e33e81ddd086e7.pdf</ext-link> (Accessed July 21, 2024).</citation></ref>
<ref id="ref13"><label>13.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Xu</surname> <given-names>Y</given-names></name> <name><surname>Yang</surname> <given-names>X</given-names></name> <name><surname>Huang</surname> <given-names>H</given-names></name> <name><surname>Peng</surname> <given-names>C</given-names></name> <name><surname>Ge</surname> <given-names>Y</given-names></name> <name><surname>Wu</surname> <given-names>H</given-names></name> <etal/></person-group>. <article-title>Extreme gradient boosting model has a better performance in predicting the risk of 90-day readmissions in patients with ischaemic stroke</article-title>. <source>J Stroke Cerebrovasc Dis</source>. (<year>2019</year>) <volume>28</volume>:<fpage>104441</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.jstrokecerebrovasdis.2019.104441</pub-id>, PMID: <pub-id pub-id-type="pmid">31627995</pub-id></citation></ref>
<ref id="ref14"><label>14.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>J</given-names></name> <name><surname>Ma</surname> <given-names>R</given-names></name> <name><surname>Eleftheriou</surname> <given-names>P</given-names></name> <name><surname>Churilov</surname> <given-names>L</given-names></name> <name><surname>Debono</surname> <given-names>D</given-names></name> <name><surname>Robbins</surname> <given-names>R</given-names></name> <etal/></person-group>. <article-title>Health economic implications of complications associated with pancreaticoduodenectomy at a university hospital: a retrospective cohort cost study</article-title>. <source>HPB</source>. (<year>2018</year>) <volume>20</volume>:<fpage>423</fpage>&#x2013;<lpage>31</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.hpb.2017.11.001</pub-id>, PMID: <pub-id pub-id-type="pmid">29248401</pub-id></citation></ref>
<ref id="ref15"><label>15.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Evers</surname> <given-names>S</given-names></name> <name><surname>Voss</surname> <given-names>G</given-names></name> <name><surname>Nieman</surname> <given-names>F</given-names></name> <name><surname>Ament</surname> <given-names>A</given-names></name> <name><surname>Groot</surname> <given-names>T</given-names></name> <name><surname>Lodder</surname> <given-names>J</given-names></name> <etal/></person-group>. <article-title>Predicting the cost of hospital stay for stroke patients: the use of diagnosis related groups</article-title>. <source>Health Policy</source>. (<year>2002</year>) <volume>61</volume>:<fpage>21</fpage>&#x2013;<lpage>42</lpage>. doi: <pub-id pub-id-type="doi">10.1016/S0168-8510(01)00219-6</pub-id>, PMID: <pub-id pub-id-type="pmid">12173495</pub-id></citation></ref>
<ref id="ref16"><label>16.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dodhia</surname> <given-names>RM</given-names></name></person-group>. <article-title>A review of applied multiple regression/correlation analysis for the behavioral sciences</article-title>. <source>J Educ Behav Stat</source>. (<year>2005</year>) <volume>30</volume>:<fpage>227</fpage>&#x2013;<lpage>9</lpage>. doi: <pub-id pub-id-type="doi">10.3102/10769986030002227</pub-id></citation></ref>
<ref id="ref17"><label>17.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rezaianzadeh</surname> <given-names>A</given-names></name> <name><surname>Dastoorpoor</surname> <given-names>M</given-names></name> <name><surname>Sanaei</surname> <given-names>M</given-names></name> <name><surname>Salehnasab</surname> <given-names>C</given-names></name> <name><surname>Mohammadi</surname> <given-names>MJ</given-names></name> <name><surname>Mousavizadeh</surname> <given-names>A</given-names></name></person-group>. <article-title>Predictors of length of stay in the coronary care unit in patient with acute coronary syndrome based on data mining methods</article-title>. <source>Clin Epidemiol Glob Health</source>. (<year>2020</year>) <volume>8</volume>:<fpage>383</fpage>&#x2013;<lpage>8</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.cegh.2019.09.007</pub-id></citation></ref>
<ref id="ref18"><label>18.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>B&#x00FC;nker</surname> <given-names>L</given-names></name> <name><surname>Hanspach</surname> <given-names>KV</given-names></name> <name><surname>Piening</surname> <given-names>A</given-names></name></person-group>. <article-title>Health economic effects after DRG-implementation &#x2013; a systematic overview</article-title>. <source>Physioscience</source>. (<year>2010</year>) <volume>6</volume>:<fpage>77</fpage>&#x2013;<lpage>8</lpage>. doi: <pub-id pub-id-type="doi">10.1055/s-0029-1245430</pub-id>, PMID: <pub-id pub-id-type="pmid">40115761</pub-id></citation></ref>
<ref id="ref19"><label>19.</label><citation citation-type="other"><person-group person-group-type="author"><name><surname>Fang</surname> <given-names>C</given-names></name> <name><surname>Shao</surname> <given-names>Z</given-names></name> <name><surname>Wu</surname> <given-names>C</given-names></name></person-group>. <italic>A low-cost method for designing and updating a DRGs classifier based on machine learning</italic>. In: Proceedings of the 4th international conference on medical and health informatics, pp. 160&#x2013;164. (<year>2020</year>).</citation></ref>
<ref id="ref20"><label>20.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Annear</surname> <given-names>PL</given-names></name> <name><surname>Kwon</surname> <given-names>S</given-names></name> <name><surname>Lorenzoni</surname> <given-names>L</given-names></name> <name><surname>Duckett</surname> <given-names>S</given-names></name> <name><surname>Huntington</surname> <given-names>D</given-names></name> <name><surname>Langenbrunner</surname> <given-names>JC</given-names></name> <etal/></person-group>. <article-title>Pathways to DRG-based hospital payment systems in Japan, Korea, and Thailand</article-title>. <source>Health Policy</source>. (<year>2018</year>) <volume>122</volume>:<fpage>707</fpage>&#x2013;<lpage>13</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.healthpol.2018.04.013</pub-id>, PMID: <pub-id pub-id-type="pmid">29754969</pub-id></citation></ref>
<ref id="ref21"><label>21.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhi</surname> <given-names>M</given-names></name> <name><surname>Hu</surname> <given-names>L</given-names></name> <name><surname>Geng</surname> <given-names>F</given-names></name> <name><surname>Shao</surname> <given-names>N</given-names></name> <name><surname>Liu</surname> <given-names>Y</given-names></name></person-group>. <article-title>Analysis of the cost and case-mix of post-acute stroke patients in China using quantile regression and the decision-tree models</article-title>. <source>Risk Manag Healthc Policy</source>. (<year>2022</year>) <volume>15</volume>:<fpage>1113</fpage>&#x2013;<lpage>27</lpage>. doi: <pub-id pub-id-type="doi">10.2147/RMHP.S361385</pub-id>, PMID: <pub-id pub-id-type="pmid">35620736</pub-id></citation></ref>
<ref id="ref22"><label>22.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gong</surname> <given-names>Z</given-names></name> <name><surname>Duckett</surname> <given-names>SJ</given-names></name> <name><surname>Legge</surname> <given-names>DG</given-names></name> <name><surname>Pei</surname> <given-names>L</given-names></name></person-group>. <article-title>Describing Chinese hospital activity with diagnosis related groups (DRGs): a case study in Chengdu</article-title>. <source>Health Policy</source>. (<year>2004</year>) <volume>69</volume>:<fpage>93</fpage>&#x2013;<lpage>100</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.healthpol.2003.12.004</pub-id>, PMID: <pub-id pub-id-type="pmid">15484610</pub-id></citation></ref>
<ref id="ref23"><label>23.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ryan</surname> <given-names>SP</given-names></name> <name><surname>Plate</surname> <given-names>JF</given-names></name> <name><surname>Goltz</surname> <given-names>DE</given-names></name> <name><surname>Attarian</surname> <given-names>DE</given-names></name> <name><surname>Wellman</surname> <given-names>SS</given-names></name> <name><surname>Seyler</surname> <given-names>TM</given-names></name> <etal/></person-group>. <article-title>Should medical severity-diagnosis related group classification be utilized for reimbursement? An analysis of Elixhauser comorbidities and cost of care</article-title>. <source>J Arthroplast</source>. (<year>2019</year>) <volume>34</volume>:<fpage>1312</fpage>&#x2013;<lpage>6</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.arth.2019.02.045</pub-id>, PMID: <pub-id pub-id-type="pmid">30904362</pub-id></citation></ref>
<ref id="ref24"><label>24.</label><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zaerpour</surname> <given-names>F</given-names></name> <name><surname>Bischak</surname> <given-names>DP</given-names></name> <name><surname>Menezes</surname> <given-names>MB</given-names></name> <name><surname>McRae</surname> <given-names>A</given-names></name> <name><surname>Lang</surname> <given-names>ES</given-names></name></person-group>. <article-title>Patient classification based on volume and case-mix in the emergency department and their association with performance</article-title>. <source>Health Care Manag Sci</source>. (<year>2020</year>) <volume>23</volume>:<fpage>387</fpage>&#x2013;<lpage>400</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s10729-019-09495-z</pub-id>, PMID: <pub-id pub-id-type="pmid">31446556</pub-id></citation></ref>
</ref-list>
</back>
</article>