<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3-mathml3.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:ali="http://www.niso.org/schemas/ali/1.0/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="systematic-review" dtd-version="1.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Endocrinol.</journal-id>
<journal-title-group>
<journal-title>Frontiers in Endocrinology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Endocrinol.</abbrev-journal-title>
</journal-title-group>
<issn pub-type="epub">1664-2392</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fendo.2026.1740126</article-id>
<article-version article-version-type="Version of Record" vocab="NISO-RP-8-2008"/>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Systematic Review</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>Traditional Chinese medicine for type 2 diabetes with metabolic-associated steatotic liver disease: unified effects and design thresholds</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name><surname>Liu</surname><given-names>Youfang</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/3268683/overview"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="visualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/visualization/">Visualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Wang</surname><given-names>Bibi</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Wang</surname><given-names>Liting</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Project-administration" vocab-term-identifier="https://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Xiong</surname><given-names>Haozhe</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Zhang</surname><given-names>Hua</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/1121666/overview"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Cheng</surname><given-names>Yang</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>*</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Project-administration" vocab-term-identifier="https://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="visualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/visualization/">Visualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
</contrib-group>
<aff id="aff1"><label>1</label><institution>Institute of Liver Diseases, Shuguang Hospital, Shanghai University of Traditional Chinese Medicine</institution>, <city>Shanghai</city>,&#xa0;<country country="cn">China</country></aff>
<aff id="aff2"><label>2</label><institution>China&#x2013;Japan Friendship Hospital, Beijing University of Chinese Medicine</institution>, <city>Beijing</city>,&#xa0;<country country="cn">China</country></aff>
<author-notes>
<corresp id="c001"><label>*</label>Correspondence: Yang Cheng, <email xlink:href="mailto:drchengyang@126.com">drchengyang@126.com</email></corresp>
</author-notes>
<pub-date publication-format="electronic" date-type="pub" iso-8601-date="2026-03-03">
<day>03</day>
<month>03</month>
<year>2026</year>
</pub-date>
<pub-date publication-format="electronic" date-type="collection">
<year>2026</year>
</pub-date>
<volume>17</volume>
<elocation-id>1740126</elocation-id>
<history>
<date date-type="received">
<day>05</day>
<month>11</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>09</day>
<month>02</month>
<year>2026</year>
</date>
<date date-type="rev-recd">
<day>29</day>
<month>01</month>
<year>2026</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2026 Liu, Wang, Wang, Xiong, Zhang and Cheng.</copyright-statement>
<copyright-year>2026</copyright-year>
<copyright-holder>Liu, Wang, Wang, Xiong, Zhang and Cheng</copyright-holder>
<license>
<ali:license_ref start_date="2026-03-03">https://creativecommons.org/licenses/by/4.0/</ali:license_ref>
<license-p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</license-p>
</license>
</permissions>
<abstract>
<sec>
<title>Objective</title>
<p>This study aims to reorganize randomized controlled trials (RCTs) of traditional Chinese medicine (TCM) for adults with type 2 diabetes mellitus (T2DM) and metabolic-associated steatotic liver disease (MASLD; including legacy NAFLD) into a clinical evidence-anchored knowledge graph (KG) and harmonize effect semantics (&#x201c;unified effects&#x201d;) to support endpoint- and design-aware evidence navigation.</p>
</sec>
<sec>
<title>Methods</title>
<p>We systematically reviewed RCTs (2015&#x2013;2025). Effect direction and scale were unified using a prespecified rule (treatment effect [TE] &gt;0 indicates improvement). The prespecified primary endpoints maximizing cross-trial comparability were alanine aminotransferase (ALT), triglycerides (TG), Homeostatic Model Assessment of Insulin resistance (HOMA-IR), and controlled attenuation parameter (CAP); aspartate aminotransferase (AST) was retained for robustness. Metabolic endpoints were synthesized at the 12-week timepoint, while imaging endpoints (CAP and liver stiffness measurement [LSM]) were synthesized within a prespecified 8- to 24-week window. Trials were stratified as add-on versus mixed, with primary efficacy inferences based on add-on trials with balanced background Western medicine. Evidence was synthesized using REML-based random-effects meta-analysis (reporting prediction intervals) and weighted meta-regression. Risk of bias was assessed using RoB 2 and certainty of evidence using GRADE.</p>
</sec>
<sec>
<title>Results</title>
<p>A total of 95 trials were included (<italic>n</italic> = 8,813; follow-up 2&#x2013;48 weeks; predominantly add-on). The KG linked intervention categories (classic formulas, custom formulas, and Chinese patent medicines) to recurrent syndrome/symptom patterns; <italic>Salvia miltiorrhiza</italic> emerged as a central herb-layer hub. In add-on trials, pooled effects for ALT, AST, HOMA-IR, and TG were directionally favorable, but heterogeneity was substantial and prediction intervals for biochemical endpoints were often wide and crossed the null. CAP showed a comparatively more reproducible short-term imaging signal than LSM. Meta-regression suggested hypothesis-generating design patterns in which estimate stability tended to improve with larger per-arm sample sizes (&#x2248;&#x2265;40&#x2013;50) and longer follow-up (&#x2248;&#x2265;12&#x2013;16 weeks). RoB 2 ratings were predominantly &#x201c;some concerns,&#x201d; and GRADE certainty was commonly downgraded for inconsistency and/or imprecision.</p>
</sec>
<sec>
<title>Conclusion</title>
<p>In adults with T2DM and MASLD, add-on trials show directionally favorable pooled biochemical/metabolic changes after unified effect harmonization, but uncertainty remains substantial. CAP may be a more reproducible short-term imaging endpoint than LSM. Evidence-derived design patterns should be interpreted as hypothesis-generating rather than causal thresholds.</p>
</sec>
<sec>
<title>Systematic Review Registration</title>
<p><ext-link ext-link-type="uri" xlink:href="https://www.crd.york.ac.uk/prospero/">https://www.crd.york.ac.uk/prospero/</ext-link>, identifier CRD420251167450.</p>
</sec>
</abstract>
<kwd-group>
<kwd>interpretable machine learning</kwd>
<kwd>knowledge graph</kwd>
<kwd>meta-analysis</kwd>
<kwd>metabolic-associated steatotic liver disease</kwd>
<kwd>traditional Chinese medicine</kwd>
<kwd>type 2 diabetes mellitus</kwd>
</kwd-group>
<funding-group>
<funding-statement>The author(s) declared that financial support was not received for this work and/or its publication.</funding-statement>
</funding-group>
<counts>
<fig-count count="11"/>
<table-count count="1"/>
<equation-count count="2"/>
<ref-count count="32"/>
<page-count count="19"/>
<word-count count="10458"/>
</counts>
<custom-meta-group>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Clinical Diabetes</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<title>Introduction</title>
<p>Metabolic dysfunction-associated steatotic liver disease (MASLD), formerly non-alcoholic fatty liver disease (NAFLD), is highly prevalent. Its progression relates to insulin resistance, lipotoxicity, chronic low-grade inflammation, and gut&#x2013;liver axis dysregulation (<xref ref-type="bibr" rid="B1">1</xref>, <xref ref-type="bibr" rid="B2">2</xref>). Type 2 diabetes mellitus (T2DM) frequently coexists with MASLD, mutually aggravating the disease course and risks of fibrosis, cirrhosis, and cardiometabolic events (<xref ref-type="bibr" rid="B3">3</xref>, <xref ref-type="bibr" rid="B4">4</xref>). Epidemiological evidence suggests that MASLD affects approximately two-thirds of adults with T2DM, underscoring the substantial scale of this comorbidity in clinical practice. Beyond prevalence, this coexistence is clinically consequential: metabolic dysregulation and insulin resistance promote hepatic steatosis and inflammation, while MASLD is associated with increased risks of fibrosis progression, cirrhosis, and adverse cardiometabolic events among patients with diabetes (<xref ref-type="bibr" rid="B5">5</xref>&#x2013;<xref ref-type="bibr" rid="B7">7</xref>). Although quantitative imaging&#x2014;controlled attenuation parameter (CAP) and liver stiffness measurement (LSM)&#x2014;supports noninvasive assessment, evidence-based therapeutic strategies for T2DM with MASLD remain constrained by limited indications, population heterogeneity, and inconsistent endpoints (<xref ref-type="bibr" rid="B4">4</xref>, <xref ref-type="bibr" rid="B8">8</xref>, <xref ref-type="bibr" rid="B9">9</xref>).</p>
<p>Traditional Chinese medicine (TCM) offers multimodal, phenotype-oriented care potentially relevant to T2DM with MASLD, with therapeutic targets spanning insulin resistance, dyslipidemia, low-grade inflammation, and the gut&#x2013;liver&#x2013;bile acid axis. In practice, classical formulas, custom formulas, Chinese patent medicines, and single herbs are commonly framed by pattern elements such as phlegm-dampness, damp-heat, liver depression, and spleen deficiency (<xref ref-type="bibr" rid="B10">10</xref>, <xref ref-type="bibr" rid="B11">11</xref>). However, translation of existing RCT evidence into actionable guidance is hindered by methodological barriers: trials vary widely in background therapy (add-on vs. mixed designs), intervention complexity, follow-up duration, and endpoint selection; endpoint direction/scale handling is often inconsistent; and analyses frequently stop at pooled averages without systematically examining effect modifiers, practical design thresholds, or integrated efficacy&#x2013;safety reporting within a prescription&#x2013;syndrome/symptom&#x2013;outcome&#x2013;AE evidence structure (<xref ref-type="bibr" rid="B12">12</xref>, <xref ref-type="bibr" rid="B13">13</xref>).</p>
<p>We aimed to reorganize randomized controlled trials&#x2019; (RCTs) evidence into a prescription&#x2013;syndrome/symptom&#x2013;outcome&#x2013;AE knowledge graph, synthesize effects using random-effects meta-analysis, quantify design thresholds via weighted meta-regression, and derive phenotype-by-target prescribing implications using clustering and interpretable machine learning. To improve interpretability and reproducibility, we implemented an RCT-anchored, multi-layer framework integrating (i) knowledge graph-based evidence organization, (ii) endpoint standardization, (iii) design-stratified random-effects synthesis, and (iv) threshold/moderator assessment via weighted meta-regression and interpretable machine learning.</p>
<p>Specifically, we introduce two methodological concepts to standardize and interpret the evidence. First, &#x201c;unified effects&#x201d; denotes the harmonization of effect direction and scale across heterogeneous endpoints by prespecifying that treatment effect (TE) &gt;0 indicates improvement, thereby enabling cross-endpoint comparability and yielding a coherent &#x201c;outcome fingerprint.&#x201d; Second, &#x201c;design thresholds&#x201d; refer to empirically derived ranges of sample size and follow-up duration (identified via weighted meta-regression and corroborated by the machine learning component) that are associated with more stable and more reproducible effect estimates.</p>
</sec>
<sec id="s2">
<title>Methods</title>
<sec id="s2_1">
<title>Reporting and registration</title>
<p>This review followed PRISMA 2020 guidelines; the protocol was registered in PROSPERO (CRD420251167450).</p>
</sec>
<sec id="s2_2">
<title>Literature search</title>
<p>We systematically searched PubMed, Embase, Web of Science, China National Knowledge Infrastructure (CNKI), Wanfang Data, and VIP Database for studies published from January 2015 to August 2025. A search strategy combining subject headings and free-text terms was adopted, with core concepts including &#x201c;NAFLD/MASLD&#x201d;, &#x201c;T2DM&#x201d;, and &#x201c;traditional Chinese medicine/Chinese herbal medicine/herbal formula&#x201d;. The reference lists of the included studies were screened manually, and citation tracking was performed (<xref ref-type="fig" rid="f1"><bold>Figure&#xa0;1</bold></xref>). Full search strategies and the PRISMA 2020 checklist are provided in <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material 1</bold></xref>.</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>PRISMA 2020 flow diagram for study selection.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fendo-17-1740126-g001.tif">
<alt-text content-type="machine-generated">Flowchart illustrating study selection process for a systematic review: records identified from multiple databases (n equals three thousand six hundred eighty two), after removing duplicates, three thousand one hundred records screened, two thousand eight hundred twenty eight excluded, leaving ninety five studies included with breakdown by type.</alt-text>
</graphic></fig>
</sec>
<sec id="s2_3">
<title>Eligibility criteria</title>
<p>The inclusion criteria were defined as follows: for study design, RCTs; regarding the study population, adults diagnosed with T2DM complicated by MASLD (including legacy NAFLD terminology; NASH treated as a progressive subtype when explicitly reported); for interventions and comparators, the intervention group received TCM interventions including classical formulas, custom formulas, Chinese patent medicines, or single herbs (with or without concomitant Western medicine), while the control group received conventional Western medicine, placebo, standard care, or lifestyle intervention; for outcomes, at least one prespecified primary outcome was extractable, including alanine aminotransferase (ALT), aspartate aminotransferase (AST), Homeostatic Model Assessment for Insulin Resistance (HOMA-IR), triglycerides (TG), controlled attenuation parameter (CAP), liver stiffness measurement (LSM), and high-density lipoprotein cholesterol (HDL-C). The exclusion criteria included non-RCT study designs, non-pharmacological TCM therapies (e.g., acupuncture, moxibustion), unclear diagnostic criteria for T2DM or MASLD/NAFLD, missing or non-convertible primary outcome data, duplicate publications or overlapping datasets, and non-journal publications (e.g., conference abstracts, dissertations). To ensure standardized reporting, eligibility criteria were explicitly mapped to the PICOS framework: participants (P), adults with T2DM and MASLD/NAFLD; interventions (I), TCM therapies (classical/custom formulas, Chinese patent medicines, or single herbs/extracts) with or without concomitant Western medicine; comparators (C), placebo, standard care, lifestyle intervention, or Western medicine; outcomes (O), at least one prespecified endpoint extractable (primary: ALT, TG, HOMA-IR, CAP; robustness/secondary: AST, HDL-C, LSM); and study design (S), parallel-group randomized controlled trials.</p>
</sec>
<sec id="s2_4">
<title>Data extraction and standardization</title>
<p>Two reviewers independently extracted and cross-checked the data, with discrepancies resolved by arbitration from a third reviewer. At the intervention layer, intervention types and standardized names/codes of formulas were unified; herbal ingredients were aligned with standard names and Latin binomials specified in the Chinese Pharmacopoeia, with syndrome-based modifications annotated (<xref ref-type="bibr" rid="B14">14</xref>). The terminologies for TCM syndromes/symptoms were standardized, and unreported items were recorded as &#x201c;NR&#x201d; (<xref ref-type="bibr" rid="B15">15</xref>, <xref ref-type="bibr" rid="B16">16</xref>). Study designs were categorized into two types: add-on indicates that both arms received background Western medicine (WM) of comparable drug classes and doses, with TCM added only to the intervention arm; and mixed indicates unequal WM intensity between arms (e.g., WM only in one arm or drug class/dose disparity). When reporting was ambiguous, we defaulted to &#x201c;mixed&#x201d; and ran design-stratified sensitivity analyses.</p>
<p>To strengthen the control of confounding by concomitant Western medicine (WM), we prespecified a trial-design stratification and documented background-therapy information at the trial level (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material 2</bold></xref>, <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table&#xa0;1</bold></xref>). Trials were categorized as add-on versus mixed (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table&#xa0;1</bold></xref>, column BA: Design_stratum). Add-on indicates that both arms received comparable background WM (same drug class and dosing rules as reported), with TCM added only to the intervention arm. Mixed indicates that background WM could differ between arms (e.g., WM used in only one arm or drug class/dose disparity) or was not explicitly standardized. For mixed trials, we further coded WM background comparability as balanced/unclear/imbalanced based on extracted WM-related fields (e.g., whether WM was used, WM names, comparator regimen/type/dose) and report this coding in <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table&#xa0;1</bold></xref> (column AZ: WM_comparability). When reporting was insufficient to judge WM balance, comparability was coded as unclear; such trials were retained in the mixed stratum and addressed via prespecified design-stratified exploratory/sensitivity analyses.</p>
<p>To ensure transparent diagnostic reporting and consistent terminology, we extracted trial-level criteria/definitions for T2DM and MASLD/NAFLD (including legacy NAFLD/NASH wording) and coded ascertainment methods. Specifically, T2DM criteria and MASLD/NAFLD criteria were captured in <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material 2</bold></xref>, <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table&#xa0;1</bold></xref> (columns N and O), and imaging modality and overall ascertainment summaries were captured in <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table&#xa0;1</bold></xref> (columns BP and BQ). These fields were used for descriptive reporting (<xref ref-type="table" rid="T1"><bold>Table&#xa0;1</bold></xref>) and to support trial-level auditability of diagnostic definitions across studies.</p>
<table-wrap id="T1" position="float">
<label>Table&#xa0;1</label>
<caption>
<p>Summary characteristics of included RCTs in adults with T2DM and MASLD (<italic>n</italic> = 95).</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="left">Characteristic</th>
<th valign="middle" align="left">Overall (<italic>n</italic> = 95)</th>
<th valign="middle" align="left">Add-on design (<italic>n</italic> = 82)</th>
<th valign="middle" align="left">Mixed design (<italic>n</italic> = 13)</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="left">Total participants, <italic>N</italic></td>
<td valign="middle" align="left">8,813</td>
<td valign="middle" align="left">7,266</td>
<td valign="middle" align="left">1,547</td>
</tr>
<tr>
<td valign="middle" align="left">Follow-up duration (weeks)</td>
<td valign="middle" align="left">2&#x2013;48; 12 [12&#x2013;12]</td>
<td valign="middle" align="left">2&#x2013;48; 12 [12&#x2013;12]</td>
<td valign="middle" align="left">4&#x2013;24; 12 [12&#x2013;16]</td>
</tr>
<tr>
<td valign="middle" align="left">Sample size per arm</td>
<td valign="middle" align="left">20&#x2013;180; 40 [33&#x2013;54]</td>
<td valign="middle" align="left">20&#x2013;100; 40 [32&#x2013;52]</td>
<td valign="middle" align="left">30&#x2013;180; 40 [38&#x2013;60]</td>
</tr>
<tr>
<td valign="middle" align="left">Country/region</td>
<td valign="middle" align="left">China: 93 (97.9%); other: 2 (2.1%)</td>
<td valign="middle" align="left">China: 80 (97.6%); other: 2 (2.4%)</td>
<td valign="middle" align="left">China:13 (100.0%); other: 0 (0.0%)</td>
</tr>
<tr>
<td valign="middle" align="left">Ascertainment (any)</td>
<td valign="middle" align="left">Guideline: 95 (100.0%)</td>
<td valign="middle" align="left">Guideline: 82 (100.0%)</td>
<td valign="middle" align="left">Guideline: 13 (100.0%)</td>
</tr>
<tr>
<td valign="middle" align="left">Imaging modality reported</td>
<td valign="middle" align="left">US: 75 (78.9%); CAP: 10 (10.5%); liver CT: 6 (6.3%); LSM: 2 (2.1%); MRI-PDFF: 1 (1.1%); &#xb9;H-MRS: 1 (1.1%)</td>
<td valign="middle" align="left">US: 64 (78.0%); CAP: 9 (11.0%); liver CT: 5 (6.1%); LSM: 2 (2.4%); MRI-PDFF: 1 (1.2%); &#xb9;H-MRS: 1 (1.2%)</td>
<td valign="middle" align="left">US: 11 (84.6%); CAP: 1 (7.7%); liver CT: 1 (7.7%); LSM: 0 (0.0%); MRI-PDFF: 0 (0.0%); &#xb9;H-MRS: 0 (0.0%)</td>
</tr>
<tr>
<td valign="middle" align="left">Background therapy reported</td>
<td valign="middle" align="left">Yes: 91 (95.8%); no/unclear: 4 (4.2%)</td>
<td valign="middle" align="left">Yes: 79 (96.3%); no/unclear: 3 (3.7%)</td>
<td valign="middle" align="left">Yes: 12 (92.3%); no/unclear: 1 (7.7%)</td>
</tr>
<tr>
<td valign="middle" align="left">Comparator type</td>
<td valign="middle" align="left">WM/standard care: 87 (91.6%); placebo: 3 (3.2%); other: 5 (5.3%)</td>
<td valign="middle" align="left">WM/standard care: 78 (95.1%); placebo: 3 (3.7%); other: 1 (1.2%)</td>
<td valign="middle" align="left">WM/standard care: 9 (69.2%); placebo: 0; other: 4 (30.8%)</td>
</tr>
<tr>
<td valign="middle" align="left">TCM intervention category</td>
<td valign="middle" align="left">Classical: 25 (26.3%); custom: 49 (51.6%); patent: 17 (17.9%); single: 4 (4.2%)</td>
<td valign="middle" align="left">Classical: 23 (28.0%); Custom: 45 (54.9%); patent: 10 (12.2%); single: 4 (4.9%)</td>
<td valign="middle" align="left">Classical: 2 (15.4%); custom: 4 (30.8%); patent: 7 (53.8%); single: 0</td>
</tr>
<tr>
<td valign="middle" align="left">TCM syndrome/pattern reported</td>
<td valign="middle" align="left">Yes: 60 (63.2%); no: 3 (3.2%); unclear/NR: 32 (33.7%)</td>
<td valign="middle" align="left">Yes: 52 (63.4%); no: 3 (3.7%); unclear/NR: 27 (32.9%)</td>
<td valign="middle" align="left">Yes:8 (61.5%); no: 0; unclear/NR: 5 (38.5%)</td>
</tr>
<tr>
<td valign="middle" align="left">Baseline age (years)</td>
<td valign="middle" align="left">Reported 89/95; 37.70&#x2013;69.88; 54.18 [49.72&#x2013;57.66]</td>
<td valign="middle" align="left">Reported 77/82; 37.70&#x2013;69.88; 54.17 [49.69&#x2013;57.66]</td>
<td valign="middle" align="left">Reported 12/13; 48.34&#x2013;63.46; 55.12 [52.80&#x2013;58.86]</td>
</tr>
<tr>
<td valign="middle" align="left">Male, %</td>
<td valign="middle" align="left">Reported 95/95; 27.63&#x2013;75.00; 55.32 [51.06&#x2013;60.00]</td>
<td valign="middle" align="left">Reported 82/82; 27.63&#x2013;75.00; 55.47 [51.06&#x2013;60.00]</td>
<td valign="middle" align="left">Reported 13/13; 36.36&#x2013;65.57; 54.84 [50.00&#x2013;60.00]</td>
</tr>
<tr>
<td valign="middle" align="left">Baseline BMI (kg/m&#xb2;)</td>
<td valign="middle" align="left">Reported 50/95; 22.60&#x2013;31.09; 26.62 [25.38&#x2013;28.45]</td>
<td valign="middle" align="left">Reported 46/82; 22.60&#x2013;31.09; 26.58 [25.38&#x2013;28.45]</td>
<td valign="middle" align="left">Reported 4/13; 25.73&#x2013;28.64; 27.39 [26.34&#x2013;28.34]</td>
</tr>
<tr>
<td valign="middle" align="left">T2DM duration (years)</td>
<td valign="middle" align="left">Reported 71/95; 0.79&#x2013;26.39; 5.66 [4.46&#x2013;7.11]</td>
<td valign="middle" align="left">Reported 60/82; 1.03&#x2013;26.39; 5.62 [4.42&#x2013;7.18]</td>
<td valign="middle" align="left">Reported 11/13; 0.79&#x2013;10.00; 6.15 [3.20&#x2013;6.86]</td>
</tr>
<tr>
<td valign="middle" align="left">Primary endpoints reported</td>
<td valign="middle" align="left">ALT: 95 (100.0%); TG: 95 (100.0%); HOMA-IR: 60 (63.2%); CAP: 21 (22.1%)</td>
<td valign="middle" align="left">ALT: 82 (100.0%); TG: 82 (100.0%); HOMA-IR: 53 (64.6%); CAP: 20 (24.4%)</td>
<td valign="middle" align="left">ALT: 13 (100.0%); TG: 13 (100.0%); HOMA-IR: 7 (53.8%); CAP: 1 (7.7%)</td>
</tr>
<tr>
<td valign="middle" align="left">Additional/robustness endpoints reported</td>
<td valign="middle" align="left">AST: 84 (88.4%); HDL-C: 30 (31.6%); LSM: 12 (12.6%)</td>
<td valign="middle" align="left">AST: 74 (90.2%); HDL-C: 25 (30.5%); LSM: 11 (13.4%)</td>
<td valign="middle" align="left">AST: 10 (76.9%); HDL-C: 5 (38.5%); LSM: 1 (7.7%)</td>
</tr>
<tr>
<td valign="middle" align="left">Safety reporting</td>
<td valign="middle" align="left">31 (32.6%)</td>
<td valign="middle" align="left">26 (31.7%)</td>
<td valign="middle" align="left">5 (38.5%)</td>
</tr>
<tr>
<td valign="middle" align="left">Risk of bias (RoB 2 overall)</td>
<td valign="middle" align="left">Low: 3 (3.2%); some concerns: 92 (96.8%); high: 0 (0.0%)</td>
<td valign="middle" align="left">Low: 3 (3.7%); some concerns: 79 (96.3%); high: 0 (0.0%)</td>
<td valign="middle" align="left">Low: 0 (0.0%); some concerns: 13 (100.0%); high: 0 (0.0%)</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>Values are summarized at the trial level. Continuous variables are reported as min&#x2013;max; median [IQR]. Baseline demographics were summarized descriptively using trial-level central values (average of intervention and comparator arms when both were available); the number of trials reporting each variable is provided. Add-on design denotes TCM added to background Western medicine in both arms (TCM + WM vs. WM). Mixed design denotes non-uniform background therapy between arms. AE, adverse event; US, ultrasound; ALT, alanine aminotransferase; AST, aspartate aminotransferase; TG, triglyceride; HDL-C, high-density lipoprotein cholesterol; HOMA-IR, homeostasis model assessment of insulin resistance; CAP, controlled attenuation parameter; LSM, liver stiffness measurement; WM, Western medicine.</p></fn>
</table-wrap-foot>
</table-wrap>
<p>Endpoint means, standard deviations (SD)/standard errors (SE)/95% confidence intervals (95%CI), and units were recorded; data from figures were digitized by two reviewers; time was unified in weeks. Units were retained in their native clinical form (e.g., ALT/AST in U/L; CAP in dB/m), and all syntheses used mean differences (MD) in original units; unit fields and effect-type coding are documented in <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material 2</bold></xref>, <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table&#xa0;4</bold></xref> (Unit and EffectType columns). Effect sizes and variances were computed in batches in R under a prespecified rule that TE &gt;0 indicates clinical improvement, mapping diverse endpoints onto a common positive-direction scale. Outcome-specific directionality (lower better vs. higher better) was prespecified based on clinical meaning and documented in <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material 2</bold></xref>, <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table&#xa0;4</bold></xref> (Directionality column). Specifically, for LowerBetter outcomes (ALT, AST, TG, HOMA-IR, CAP, LSM), improvement corresponds to a decrease and TE was defined as:</p>
<disp-formula>
<mml:math display="block" id="M1"><mml:mrow><mml:mi>T</mml:mi><mml:mi>E</mml:mi><mml:mo>=</mml:mo><mml:msub><mml:mover accent="true"><mml:mi>X</mml:mi><mml:mo>&#xaf;</mml:mo></mml:mover><mml:mrow><mml:mi>c</mml:mi><mml:mi>o</mml:mi><mml:mi>n</mml:mi><mml:mi>t</mml:mi><mml:mi>r</mml:mi><mml:mi>o</mml:mi><mml:mi>l</mml:mi></mml:mrow></mml:msub><mml:mo>&#x2212;</mml:mo><mml:msub><mml:mover accent="true"><mml:mi>X</mml:mi><mml:mo>&#xaf;</mml:mo></mml:mover><mml:mrow><mml:mi>t</mml:mi><mml:mi>r</mml:mi><mml:mi>e</mml:mi><mml:mi>a</mml:mi><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math>
</disp-formula>
<p>For HigherBetter outcomes (notably HDL-C), improvement corresponds to an increase and TE was defined as:</p>
<disp-formula>
<mml:math display="block" id="M2"><mml:mrow><mml:mi>T</mml:mi><mml:mi>E</mml:mi><mml:mo>=</mml:mo><mml:msub><mml:mover accent="true"><mml:mi>X</mml:mi><mml:mo>&#xaf;</mml:mo></mml:mover><mml:mrow><mml:mi>t</mml:mi><mml:mi>r</mml:mi><mml:mi>e</mml:mi><mml:mi>a</mml:mi><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:mo>&#x2212;</mml:mo><mml:msub><mml:mover accent="true"><mml:mi>X</mml:mi><mml:mo>&#xaf;</mml:mo></mml:mover><mml:mrow><mml:mi>c</mml:mi><mml:mi>o</mml:mi><mml:mi>n</mml:mi><mml:mi>t</mml:mi><mml:mi>r</mml:mi><mml:mi>o</mml:mi><mml:mi>l</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:math>
</disp-formula>
<p>Mean difference (MD) was used for all outcomes in this review because units were consistent across the included trials; SMD was prespecified only as a contingency when units were not reconcilable but was not required in the final dataset (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material 2</bold></xref>, <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table&#xa0;4</bold></xref>, Effect Type column).</p>
<p>As this was a systematic review, no medicinal materials were procured by us. For each included trial, when reported we extracted (i) product type (classic/custom formula, Chinese patent medicine, single herb/extract), (ii) English and Latin names of herbs, and (iii) manufacturer/supplier, approval or batch number, and quality control information (e.g., marker compounds, assay methods) for Chinese patent medicines or extracts. Where trials did not report such information, items were recorded as NR.</p>
</sec>
<sec id="s2_5">
<title>Knowledge graph construction</title>
<p>Entities (formulas/Chinese patent medicines, herbs, TCM syndromes/symptoms, outcomes, adverse events [AEs]) and relations (formula&#x2013;herb; formula&#x2013;syndrome/symptom; formula&#x2013;outcome; formula/Chinese patent medicine&#x2013;AE) were derived from the standardized tables. For each formula &#xd7; outcome pair, aggregated TE and directional consistency informed edge weights/colors; node weights reflected study counts. Multi-arm trials were split by intervention group while retaining trial attributes, including Design_stratum (add-on/mixed) and intervention category metadata. For knowledge-graph visualization, multi-arm trials were represented as separate intervention nodes to preserve intervention-level relations; however, for meta-analytic pooling and meta-regression, shared-control multi-arm structures were handled using prespecified Cochrane-style rules to avoid double-counting (see &#x201c;Meta-analysis&#x201d;&#x2014;handling of multi-arm trials and shared controls). Communities were detected by the Louvain algorithm (labels 1&#x2013;5 used only for description). Details are provided in <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material 2</bold></xref>.</p>
<p>Safety/AEs (coding and completeness): Because safety outcomes are frequently underreported, we explicitly distinguished &#x201c;AE not reported (NR/unclear)&#x201d; from &#x201c;AE not observed (explicitly stated no AEs)&#x201d; at the trial level. AE reporting status was coded as reported (Y), explicitly stated no AEs (N; zero events observed), or not reported/unclear (NR/unclear) (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material 2</bold></xref>, <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table&#xa0;1</bold></xref>, column BH: AE_reported). AE types were summarized only among trials with available safety information (Y or N), and the reported AE spectrum is tabulated in <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material 2</bold></xref> (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table&#xa0;5</bold></xref>) and visualized in <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Figure&#xa0;3</bold></xref>.</p>
</sec>
<sec id="s2_6">
<title>Meta-analysis</title>
<p>From the knowledge graph, we pre-specified primary endpoints to maximize four-domain coverage and cross-trial comparability&#x2014;ALT (<italic>k</italic> &#x2248; 70) and TG (<italic>k</italic> &#x2248; 74) for high evidence density with uniform units, HOMA-IR (<italic>k</italic> &#x2248; 47 after harmonizing spellings) for the metabolic domain, and CAP (<italic>k</italic> &#x2248; 8) as the imaging marker&#x2014;with AST (<italic>k</italic> &#x2248; 77) retained for robustness. These outcomes were predominantly reported as means &#xb1; SD at the most populated 12-week timepoint, permitting MD-based pooling.</p>
<p>To reduce clinical heterogeneity and enhance interpretability, we prespecified a TCM intervention taxonomy using the trial-level variable TCM_category (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material 2</bold></xref>, <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table&#xa0;1</bold></xref>, column AN): classic and custom denote classic and custom formulas, whereas patent and single denote Chinese patent medicines and single-herb preparations/extracts, respectively. Primary metabolic endpoints (ALT, AST, TG, and HOMA-IR) were analyzed at the 12-week timepoint to maximize comparability across trials. Imaging endpoints (CAP and LSM) were synthesized using a broader 8- to 24-week window due to reporting variability; when multiple timepoints were available, we preferentially selected the latest assessment within the prespecified window.</p>
<p>To strengthen the control of confounding from background WM, we conducted prespecified stratified analyses by trial design (add-on vs. mixed; <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material 2</bold></xref>, <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table&#xa0;1</bold></xref>, column BA) and explicitly assessed background-therapy comparability for mixed trials (balanced/unclear/imbalanced; <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material 2</bold></xref>, <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table&#xa0;1</bold></xref>, column AZ). Accordingly, primary efficacy conclusions are based on add-on trials, while mixed trials are presented as exploratory/sensitivity evidence. In addition, we conducted random-effects meta-analyses stratified by TCM_category (classic/custom/patent/single) and performed sensitivity analyses restricted to formulas only (classic + custom); our main analysis excluded single-herb/extract trials due to sparse evidence and to avoid mixing fundamentally different intervention types, with single-herb/extract trials presented separately as exploratory evidence.</p>
<p>Risk of bias and certainty of evidence: Risk of bias was assessed with the Cochrane RoB 2 tool across five domains (D1: randomization process; D2: deviations from intended interventions; D3: missing outcome data; D4: measurement of the outcome; D5: selection of the reported result) by two independent reviewers with third-party adjudication, and visualized in R (robvis). To ensure transparent and reproducible judgments under common reporting gaps in this literature, we prespecified domain-level decision rules, including explicit handling of missing information (defaulting to &#x201c;some concerns&#x201d; when reporting was insufficient to support a &#x201c;low&#x201d; judgment; <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material 2</bold></xref>, <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table&#xa0;10</bold></xref>). Certainty of evidence for each primary outcome was evaluated using the GRADE approach and summarized in a Summary of Findings table (downgrading for risk of bias, inconsistency, imprecision, and publication bias as applicable; <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material 2</bold></xref>, <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table&#xa0;9</bold></xref>).</p>
<p>Handling of multi-arm trials and shared controls: When a trial included multiple eligible TCM arms sharing a single control group, we avoided double-counting the shared control. Following Cochrane guidance, we preferentially combined similar TCM arms within the same TCM_category into a single comparison (pooling means/SDs and sample sizes). If arms could not be meaningfully combined (e.g., belonging to different TCM_category), we split the control group sample size evenly across comparisons for variance estimation while keeping the original control mean and SD unchanged. In all cases, each study contributed at most one independent contrast per TCM_category per outcome&#x2013;time window to the primary pooling.</p>
<p>For data pooling, a restricted maximum likelihood (REML)-based random-effects model was used. We reported the pooled effect size, 95% CI, <italic>I</italic>&#xb2; statistic, <italic>&#x3c4;</italic>&#xb2;, and 95% prediction interval (PI). Prediction intervals were computed for key outcomes to reflect the expected range of effects in a future single study under the random-effects model <inline-formula>
<mml:math display="inline" id="im1"><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mtext>&#x3bc;</mml:mtext><mml:mo>&#xb1;</mml:mo><mml:msub><mml:mi>t</mml:mi><mml:mrow><mml:mi>k</mml:mi><mml:mo>&#x2212;</mml:mo><mml:mn>2</mml:mn><mml:mo>,</mml:mo><mml:mn>0.975</mml:mn></mml:mrow></mml:msub><mml:mo>&#xd7;</mml:mo><mml:msqrt><mml:mrow><mml:mi>S</mml:mi><mml:msubsup><mml:mi>E</mml:mi><mml:mtext>&#x3bc;</mml:mtext><mml:mn>2</mml:mn></mml:msubsup><mml:mo>+</mml:mo><mml:msup><mml:mtext>&#x3c4;</mml:mtext><mml:mn>2</mml:mn></mml:msup></mml:mrow></mml:msqrt><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula>. Prediction intervals were computed for syntheses with sufficient studies (typically <italic>k</italic> &#x2265; 3). Small-study effects and potential publication bias were assessed using funnel plots. Robustness was examined via Baujat plots, leave-one-out analysis, and top-&#x394; analysis. The PI results are summarized in <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material 2</bold></xref> (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table&#xa0;7</bold></xref>, <xref ref-type="supplementary-material" rid="SM1"><bold>S8</bold></xref>).</p>
</sec>
<sec id="s2_7">
<title>Weighted meta-regression</title>
<p>Separate models were fitted for add-on and mixed designs using the rma.mv function, with random effects specified at the study level (SourceID). Sample size (per arm) and treatment course (weeks) served as core covariates (with splines applied if necessary), while herb dosage and intervention type (TCM_category) were included as optional covariates. To minimize within-study dependence and prevent double-counting from multi-arm/shared-control structures, the meta-regression dataset was constructed such that each SourceID contributed at most one effect size per outcome within the prespecified time window (and, when stratified, per TCM_category). Accordingly, the analytic unit for meta-regression and threshold modeling was effectively study-level. This analysis aimed to identify &#x201c;design thresholds,&#x201d; defined as evidence-derived ranges of sample size and duration in which effect estimates show improved stability (i.e., reduced variability) and consistency. Adjusted effect curves, candidate thresholds, and coefficient summaries were outputted.</p>
</sec>
<sec id="s2_8">
<title>Phenotypic clustering and strategy matrix</title>
<p>A binary matrix was constructed based on standardized TCM syndromes/symptoms (reported = 1; unreported [NR] was retained in a separate column). The ConsensusClusterPlus package (Jaccard distance, ward.D2 linkage) was used to evaluate the cumulative distribution function (CDF), &#x394;-area, and sample tracking plots for <italic>K</italic> = 2&#x2013;8 to determine the optimal number of clusters.</p>
<p>Cluster profiles and discriminative features were visualized, and mappings among clusters, prescriptions, and outcomes were used to generate a &#x201c;phenotype &#xd7; prescription&#x201d; strategy matrix.</p>
</sec>
<sec id="s2_9">
<title>Machine learning</title>
<p>For classification (TE &gt; 0) and regression (continuous TE) models, each &#x201c;outcome &#xd7; trial arm&#x201d; was treated as an independent sample. XGBoost was used as the primary model, with glmnet and ranger employed for sensitivity analyses. Model performance was evaluated using fivefold study-grouped cross-validation (GroupKFold by SourceID), such that all rows from the same SourceID were assigned to the same fold to prevent leakage; performance metrics were computed from aggregated out-of-fold (OOF) predictions (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material S2</bold></xref>, <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table&#xa0;11</bold></xref>), including ROC-AUC (OOF), PR-AUC (OOF), Brier score (OOF), and calibration diagnostics (e.g., 10-bin ECE; <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material S2</bold></xref>, <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table&#xa0;11</bold></xref>; calibration curve in <xref ref-type="fig" rid="f2"><bold>Figure&#xa0;2C</bold></xref>). As robustness checks, we conducted a leave-one-study-out (LOSO-like) sensitivity analysis and assessed driver stability (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material S2</bold></xref>, <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table&#xa0;12</bold></xref>) and performed subset robustness analyses restricting to larger trials (e.g., <italic>n</italic> &#x2265; 40 per arm) or lower-uncertainty effects (e.g., SE_TE &#x2264; median) (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material S2</bold></xref>, <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table&#xa0;13</bold></xref>). SHAP (SHapley Additive exPlanations) and ALE (accumulated local effects) were applied to characterize the effects of key features and their evidence-derived, hypothesis-generating threshold intervals.</p>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>Model performance and interpretability (OOF). <bold>(A)</bold> ROC curves (grouped cross-validation; AUC shown). <bold>(B)</bold> PR curves. <bold>(C)</bold> Calibration (Brier = 0.112). <bold>(D)</bold> Global SHAP (top 20): trial-level variables&#x2014;<italic>n</italic><sub>treat</sub>/<italic>n</italic><sub>control</sub>, follow-up weeks, design type&#x2014;rank highest. <bold>(E)</bold> ALE for <italic>n</italic><sub>treat</sub>/<italic>n</italic><sub>control</sub>, weeks, SE_TE: small-sample amplification &#x2192; post-threshold stabilization; higher SE_TE is unfavorable. <bold>(F)</bold> PDP (same variables) consistent with ALE.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fendo-17-1740126-g002.tif">
<alt-text content-type="machine-generated">Collage of eleven data visualizations showing model evaluation metrics and feature importance, including ROC and calibration curves, a bar chart of top predictors, and line plots of accumulated local effects and partial dependencies for treatment, control, follow-up duration, and standard error.</alt-text>
</graphic></fig>
</sec>
<sec id="s2_10">
<title>Statistical software</title>
<p>All analyses were conducted using R 4.4.1. Key R packages included metafor, meta, clubSandwich, dplyr, ggplot2, ConsensusClusterPlus, tidymodels, xgboost, glmnet, ranger, shapviz, pROC, and showtext. Complete analysis scripts are provided in <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material 3</bold></xref>.</p>
</sec>
</sec>
<sec id="s3" sec-type="results">
<title>Results</title>
<sec id="s3_1">
<title>Basic characteristics</title>
<p>We included 95 randomized controlled trials (RCTs; 2015&#x2013;2025; <italic>n</italic> = 8,813; <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material S1</bold></xref>). The intervention arms comprised 4,389 participants, and follow-up duration ranged from 2 to 48 weeks overall (median 12 [12&#x2013;12]). The trial-level characteristics for all included RCTs (<italic>n</italic> = 95) are presented in <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material S2</bold></xref>, and structured datasets supporting the knowledge-graph layers are provided in <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material S2</bold></xref> (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Tables&#xa0;1</bold></xref>-<xref ref-type="supplementary-material" rid="SM1"><bold>S5</bold></xref>). Detailed trial-level diagnostic criteria/definitions and assessment methods are summarized in <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material 2</bold></xref>, <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table&#xa0;1</bold></xref> (columns N&#x2013;O and BP&#x2013;BQ).</p>
<p>As summarized in <xref ref-type="table" rid="T1"><bold>Table&#xa0;1</bold></xref>, most trials used an add-on design (<italic>n</italic> = 82; 7,266 participants), with the remainder classified as mixed (<italic>n</italic> = 13; 1,547 participants). The sample size per arm ranged from 20 to 180 (median 40 [33&#x2013;54]). Trials were predominantly conducted in China (93/95, 97.9%), and diagnosis/ascertainment was guideline-based in all studies (95/95, 100%). Ascertainment (diagnostic) imaging modalities were dominated by ultrasound (75/95, 78.9%). CAP-based assessment was used as an ascertainment modality in 10 trials (10.5%), while other modalities were less frequent (liver CT 6/95, 6.3%; LSM 2/95, 2.1%; MRI-PDFF 1/95, 1.1%; and &#xb9;H-MRS 1/95, 1.1%). Background therapy was reported in 91 trials (95.8%). Most comparators were Western medicine/standard care (87/95, 91.6%), with fewer placebo-controlled trials (3/95, 3.2%).</p>
<p>Interventions were mainly TCM compound formulas (74/95, 77.9%; 25 classical and 49 custom), followed by Chinese patent medicines (17/95, 17.9%) and single herbs (4/95, 4.2%). Syndrome/pattern information was reported in 60 trials (63.2%), whereas 32 trials (33.7%) did not report or were unclear/NR. Baseline demographics were variably reported at the trial level: age was available in 89/95 trials (median 54.18 years [49.72&#x2013;57.66]), male proportion in 95/95 (median 55.32% [51.06&#x2013;60.00]), BMI in 50/95 (median 26.62 kg/m&#xb2; [25.38&#x2013;28.45]), and T2DM duration in 71/95 (median 5.66 years [4.46&#x2013;7.11]).</p>
<p>Regarding outcome coverage, ALT and TG were reported in all trials (95/95, 100%), whereas HOMA-IR (60/95, 63.2%) and CAP as an outcome endpoint (21/95, 22.1%) were less frequently reported. Notably, CAP may appear either as an ascertainment modality or as a follow-up endpoint; this proportion here refers specifically to CAP reported as an outcome and is not intended to match ascertainment-modality reporting. Among additional/robustness endpoints, AST was reported in 84 trials (88.4%), HDL-C in 30 (31.6%), and LSM in 12 (12.6%).</p>
<p>Safety reporting was limited: 31 trials (32.6%) reported AE data and 10 (10.5%) explicitly stated that no AEs occurred (zero events observed), while 54 (56.8%) did not report safety outcomes (NR/unclear) (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material 2</bold></xref>, <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table&#xa0;1</bold></xref>, column BH; <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Figure&#xa0;1</bold></xref>). RoB 2 overall ratings were predominantly &#x201c;some concerns&#x201d; (92/95, 96.8%), with three trials rated &#x201c;low&#x201d; risk and none rated &#x201c;high&#x201d; (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Figure&#xa0;1</bold></xref>). <xref ref-type="fig" rid="f3"><bold>Figure&#xa0;3</bold></xref> provides an at-a-glance roadmap for readers (including non-TCM practitioners), summarizing our end-to-end workflow and key outputs&#x2014;from evidence standardization and knowledge-graph organization to meta-analytic synthesis, design thresholds, and phenotype-guided strategy implications.</p>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>Evidence-to-translation roadmap. The diagram integrates the study workflow into four key domains: evidence pipeline: standardization of 95 RCTs (TE &gt; 0) into a structured knowledge graph; unified outcome fingerprint: visual summary of consistent improvements in ALT, AST, HOMA-IR, TG, and CAP (with short-term LSM noted as unstable); design thresholds: empirically derived sample size (&#x2265;40&#x2013;50/arm) and duration (&#x2265;12&#x2013;16 weeks) benchmarks for reproducibility; and strategy matrix: phenotype-stratified prescribing implications (e.g., classical formulas for mild profiles vs. custom formulas for phlegm-damp/heat).</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fendo-17-1740126-g003.tif">
<alt-text content-type="machine-generated">Scientific infographic illustrating evidence-driven workflows for phenotypic strategies in T2DM with MASLD, showing a knowledge graph and data matrix from 95 RCTs, weighted meta-regression, explainable machine learning, treatment formulae, symptom clusters, chart panels, a co-occurrence network, and performance metrics.</alt-text>
</graphic></fig>
</sec>
<sec id="s3_2">
<title>Knowledge graph construction</title>
<p>Interventions&#x2013;syndromes/symptoms&#x2013;core herbs (<xref ref-type="fig" rid="f4"><bold>Figure&#xa0;4</bold></xref>) and TCM intervention distribution (<xref ref-type="fig" rid="f4"><bold>Figure&#xa0;4A</bold></xref>): Classical formulas were most commonly used overall. Banxia Xiexin Decoction appeared in four trials, Qingfei Xiegan Decoction, Modified Erchen Decoction, and Gegen Qinlian Decoction in three trials each, and Huagan Decoction in two. Among custom formulas, Lipi Huatan Quyu appeared in three trials, and Shenmai Lanling Decoction, Huatan Quyu Decoction, and Buxin Tongmai Decoction in two each. For Chinese patent medicines, Liuwei Dihuang Pill appeared in two trials. All remaining TCM interventions each appeared once.</p>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>Distribution of interventions, syndromes, symptoms, and herbs (by number of studies). <bold>(A)</bold> Formula frequency by type. <bold>(B)</bold> Top 15 TCM syndromes. <bold>(C)</bold> Top 15 TCM symptoms. <bold>(D)</bold> Top 15 herbs. Bars are stacked by intervention type.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fendo-17-1740126-g004.tif">
<alt-text content-type="machine-generated">Four grouped bar charts labeled A through D display data on Chinese medicine interventions. Chart A shows formula frequency by type, with bars indicating classic formulas, creative formulas, and unknown types. Chart B presents top syndromes by intervention type, chart C shows top symptoms, and chart D highlights top herbs, each utilizing stacked bars colored for creative formula, classic formula, and Chinese patent medicine, with the x-axis showing the number of studies.</alt-text>
</graphic></fig>
<p>Top syndromes (<xref ref-type="fig" rid="f4"><bold>Figure&#xa0;4B</bold></xref>): The leading syndromes were liver depression and spleen deficiency, intermingled phlegm&#x2013;stasis, and Qi&#x2013;Yin deficiency. By category, custom formulas contributed the largest share, followed by classical formulas, with CPMs the least.</p>
<p>Top symptoms (<xref ref-type="fig" rid="f4"><bold>Figure&#xa0;4C</bold></xref>): Poor appetite, lassitude, and epigastric distension were most common; classical formulas covered the broadest symptom spectrum, then custom formulas, with CPMs the lowest.</p>
<p>Top herbs (<xref ref-type="fig" rid="f4"><bold>Figure&#xa0;4D</bold></xref>): <italic>Salvia miltiorrhiza</italic> ranked first, followed by <italic>Poria</italic>, <italic>Astragalus membranaceus</italic>, and <italic>Atractylodes macrocephala</italic>. Herb contributions were highest in custom, then classical formulas, and lowest in CPMs.</p>
<p>Interventions&#x2013;syndrome/symptom associations (<xref ref-type="fig" rid="f5"><bold>Figure&#xa0;5</bold></xref>)&#x2014;formula &#xd7; syndrome network (<xref ref-type="fig" rid="f5"><bold>Figure&#xa0;5A</bold></xref>). Links were densest for liver depression and spleen deficiency, intermingled phlegm&#x2013;stasis, and Qi&#x2013;Yin deficiency. Custom formulas (e.g., Lipi Huatan Quyu, Shenmai Lanling) predominated, with classical formulas (e.g., Banxia Xiexin, Gegen Qinlian) close behind.</p>
<fig id="f5" position="float">
<label>Figure&#xa0;5</label>
<caption>
<p>Formula&#x2013;phenotype associations. <bold>(A)</bold> Bipartite network of top 10 formulas &#xd7; top 10 syndromes. <bold>(B)</bold> Formula &#xd7; top 10 symptoms heatmap (primary vs. secondary). <bold>(C)</bold> Sankey: syndrome &#x2192; key symptom &#x2192; formula (five classical + five custom). <bold>(D)</bold> Alluvial: Chinese patent medicine &#x2192; syndrome &#x2192; symptom.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fendo-17-1740126-g005.tif">
<alt-text content-type="machine-generated">Panel A shows a network graph mapping the top ten classical and non-classical formulas to syndromes using nodes and connecting lines. Panel B presents a heatmap linking formulas to the ten most frequent primary and secondary symptoms, with color intensity representing reference frequency. Panel C features a Sankey diagram illustrating flows from syndromes to symptoms to formulas, distinguishing classic and non-classic interventions with color. Panel D displays a Sankey diagram of Chinese patent medicines to syndromes to symptoms, with flows indicating frequency and syndrome subtypes. Each visual compares relationships and frequencies related to traditional medicine data.</alt-text>
</graphic></fig>
<p>Formula&#x2013;symptom heatmap (<xref ref-type="fig" rid="f5"><bold>Figure&#xa0;5B</bold></xref>): Primary symptoms clustered as poor appetite, lassitude/fatigue, abdominal distension, and white greasy tongue coating, with classical formulas showing the most concentrated pairings&#x2014;Banxia Xiexin Decoction and Gegen Qinlian Decoction in particular. Secondary symptoms&#x2014;tooth-marked tongue and abdominal bloating&#x2014;were more extensively covered by custom formulas, notably Lipi Huatan Quyu Formula and Shenmai Lanling Formula.</p>
<p>Sankey diagram (<xref ref-type="fig" rid="f5"><bold>Figure&#xa0;5C</bold></xref>): The primary syndrome &#x2192; key symptom &#x2192; formula pathway concentrated on liver depression and spleen deficiency, Qi&#x2013;Yin deficiency, and intermingled phlegm&#x2013;stasis. Key symptoms were lassitude/fatigue, poor appetite, tooth-marked tongue, and abdominal distension. Highly connected formulas included classical regimens&#x2014;Compound Gegen Qinlian Formula, Modified Erchen Decoction, Shenling Baizhu Powder plus Erchen Decoction&#x2014;and custom regimens&#x2014;Bushen Jianpi Formula, Yangyin Yunjin Formula, Yixiao Formula.&#x200b; CPM &#x2192; syndrome &#x2192; symptom (<xref ref-type="fig" rid="f5"><bold>Figure&#xa0;5D</bold></xref>). CPMs such as Qinggan Jiangzhuo, Ganhuang, and Tanggankang mainly targeted liver depression and spleen deficiency, spleen deficiency with dampness, or damp heat, corresponding to lassitude/fatigue, poor appetite, and epigastric distension.</p>
<p>Herb co-occurrence, dosage, and processing (<xref ref-type="fig" rid="f6"><bold>Figure&#xa0;6</bold></xref>)&#x2014;herb&#x2013;herb network (<xref ref-type="fig" rid="f6"><bold>Figure&#xa0;6A</bold></xref>): <italic>Salvia miltiorrhiza</italic> acted as the strongest hub, forming three clusters: cluster 1: <italic>Salvia miltiorrhiza</italic>&#x2014;<italic>Astragalus membranaceus</italic>&#x2014;<italic>Crataegus pinnatifida</italic> var. <italic>major</italic>/<italic>Citrus reticulata</italic>&#x2014;<italic>Atractylodes macrocephala</italic>; cluster 2: <italic>Pinellia ternata</italic>&#x2014;<italic>Glycyrrhiza uralensis</italic>&#x2014;<italic>Coptis chinensis</italic>&#x2014;<italic>Codonopsis pilosula</italic>/<italic>Pueraria lobata</italic>; side cluster: including <italic>Bupleurum chinense</italic>, connected to <italic>Atractylodes macrocephala</italic>.</p>
<fig id="f6" position="float">
<label>Figure&#xa0;6</label>
<caption>
<p>Herb co-occurrence, dosage, and processing. <bold>(A)</bold> Herb&#x2013;herb co-occurrence network with Louvain communities. <bold>(B)</bold> Presence/absence heatmap (representative formulas &#xd7; top 30 herbs). <bold>(C)</bold> Dosage heatmap (top 25 herbs; log10 grams). <bold>(D)</bold> Patent medicine &#x2192; herb Sankey.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fendo-17-1740126-g006.tif">
<alt-text content-type="machine-generated">Panel A shows a network diagram of the top thirty herbs with nodes sized by co-occurrence strength and colored by community, where edges indicate co-occurrences. Panel B displays a clustered heatmap of the presence or absence of top thirty herbs across multiple formulas, with rows colored by formula type. Panel C presents a clustered heatmap representing log-transformed herb dosage values among the top twenty-five herbs for various formulas, with color gradients indicating dose levels and formula type markers. Panel D features a Sankey diagram linking Chinese patent medicines on the left to herbs on the right, with connections colored by processing type.</alt-text>
</graphic></fig>
<p>Top herbs and modules (<xref ref-type="fig" rid="f6"><bold>Figure&#xa0;6B</bold></xref>): Classical and custom formulas shared a universal base (<italic>Pinellia</italic>&#x2013;<italic>Poria</italic>&#x2013;<italic>Citrus reticulata</italic>&#x2013;<italic>Atractylodes macrocephala</italic>&#x2013;<italic>Glycyrrhiza</italic>), commonly augmented by selective pairs (<italic>Astragalus</italic> and <italic>Codonopsis</italic>; <italic>Coptis</italic> and <italic>Scutellaria</italic>) and <italic>Bupleurum</italic>.</p>
<p>Dosage heatmap (<xref ref-type="fig" rid="f6"><bold>Figure&#xa0;6C</bold></xref>): A moderate-dose base (e.g., <italic>Poria</italic>, <italic>Pinellia</italic>, <italic>Citrus reticulata</italic>) was superimposed with high-dose hotspots (e.g., <italic>Salvia</italic>, <italic>Bupleurum</italic>, <italic>Crataegus</italic>).</p>
<p>CPM&#x2013;herb flow diagram (<xref ref-type="fig" rid="f6"><bold>Figure&#xa0;6D</bold></xref>): Various Chinese patent medicines, represented by Ganshuang Granule and Liuwei Dihuang Pill, were mainly connected to core herbs such as <italic>Salvia miltiorrhiza</italic>, <italic>Alisma orientale</italic>, and <italic>Poria cocos</italic>.</p>
<p>Formula&#x2013;syndrome pathways to outcomes (<xref ref-type="fig" rid="f7"><bold>Figure&#xa0;7</bold></xref>)&#x2014;main pathway (<xref ref-type="fig" rid="f7"><bold>Figure&#xa0;7A</bold></xref>): Formulas such as Buqi Shugan, Compound Gegen Qinlian, Jianpi Xiaozhi, Lipi Huatan Quyu, and Shenmai Lanling connected to outcomes through intermingled phlegm&#x2013;stasis, liver depression and Qi stagnation, liver depression, and spleen deficiency, and Qi&#x2013;Yin deficiency. Custom formulas tended to map to glucose/lipid metabolism, whereas classical formulas were relatively more oriented to liver function.</p>
<fig id="f7" position="float">
<label>Figure&#xa0;7</label>
<caption>
<p>Formula&#x2013;syndrome pathways to outcomes. <bold>(A)</bold> Sankey: formula &#x2192; syndrome &#x2192; outcome. <bold>(B)</bold> Heatmap: formula &#xd7; outcome domains. <bold>(C)</bold> Outcome network modules. <bold>(D)</bold> Community&#x2013;outcome mapping. <bold>(E)</bold> Heatmap: high-frequency syndromes &#xd7; outcomes. <bold>(F)</bold> Heatmap: formulas &#xd7; specific outcome indicators. ALT, alanine aminotransferase; AST, aspartate aminotransferase; HOMA-IR, Homeostatic Model Assessment of Insulin Resistance; TG, triglycerides; CAP, controlled attenuation parameter; LSM, liver stiffness measurement.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fendo-17-1740126-g007.tif">
<alt-text content-type="machine-generated">Panel A shows a Sankey diagram visualizing links between Chinese medicine formulas, syndromes, and outcome categories distinguished by formula type. Panel B presents a heatmap showing frequency of outcome categories by formula. Panel C displays a network diagram illustrating co-improvement relationships between clinical outcomes, with colored nodes indicating different communities. Panel D provides a Sankey diagram connecting network communities to outcome categories, with colored flows representing node counts. Panel E features a heatmap of syndrome-outcome category frequencies, with shading representing frequency intensity. Panel F presents a heatmap mapping formula-outcome frequency and effect direction for the top twelve formulas across five outcome categories.</alt-text>
</graphic></fig>
<p>Coverage heatmap (<xref ref-type="fig" rid="f7"><bold>Figure&#xa0;7B</bold></xref>): Shenmai Lanling Formula had the widest coverage across outcomes, especially for glucose metabolism and liver function indicators. Jianpi Xiaozhi Formula, Modified Erchen Formula, and Quzhi Jiangtang The formula mainly focused on glucose and lipid outcomes. Fuzheng Shugan Formula and Compound Gegen Qinlian Formula showed a more balanced distribution, covering liver function, inflammatory immunity, and MASLD-specific indicators.</p>
<p>Outcome&#x2013;outcome network (<xref ref-type="fig" rid="f7"><bold>Figure&#xa0;7C</bold></xref>): Hubs (ALT/AST, fasting blood glucose (FBG)/hemoglobin A1c(HbA1c), and total cholesterol (TC)/TG) formed modules of liver function, lipids, glycemia/islet, and inflammation/syndromes. The strongest co-improvements were glucose &#x2194; lipids and liver function &#x2194; inflammation, indicating a multidimensional benefit.</p>
<p>Community&#x2013;outcome mapping (<xref ref-type="fig" rid="f7"><bold>Figure&#xa0;7D</bold></xref>): Louvain-detected communities were mapped as follows: community 1: anthropometry, glucose metabolism, liver function; community 2: lipid metabolism, inflammatory immunity; community 3: MASLD-specific indicators and intestinal flora; communities 4&#x2013;5: molecular biochemistry and TCM-syndrome-related outcomes.</p>
<p>Syndrome &#xd7; outcome (<xref ref-type="fig" rid="f7"><bold>Figure&#xa0;7E</bold></xref>): Liver depression and spleen deficiency syndrome and intermingled phlegm and stasis syndrome were most frequent, corresponding mainly to glucose metabolism, liver function, and lipid metabolism outcomes.</p>
<p>Formula&#xd7;outcome (<xref ref-type="fig" rid="f7"><bold>Figure&#xa0;7F</bold></xref>; <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Figure&#xa0;2</bold></xref>): TCM interventions such as Gegen Qinlian Decoction, Modified Erchen Decoction, Huatan Quyu Formula, and Liuwei Dihuang Pill reduced FBG, HbA1c, 2-h blood glucose (2hBG), TG, TC, low-density lipoprotein cholesterol (LDL-C), ALT, AST, gamma-glutamyl transferase (GGT), and CAP in &#x2265;2 randomized controlled trials. Supplementary figures showed concentrated dark blocks for classical formulas in glucose control, lipid lowering, and hepatoprotection, whereas custom formulas displayed stronger intensity for insulin resistance/islet function, inflammation/immunity, anthropometry, gut microbiota, and TCM syndrome outcomes.</p>
<p>Safety (reporting completeness and AE spectrum): Safety reporting was incomplete across the included evidence: 31/95 trials (32.6%) explicitly reported AE data, 10/95 trials (10.5%) explicitly stated that no AEs occurred (zero events observed), whereas 54/95 trials (56.8%) did not report safety outcomes (NR/unclear) (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material 2</bold></xref>, <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table&#xa0;1</bold></xref>, column BH). Accordingly, the AE spectrum is summarized only within trials with available safety information. The reported AEs were mainly mild gastrointestinal and systemic symptoms (e.g., diarrhea, hypoglycemia, gastrointestinal reactions, nausea/vomiting, dizziness, fatigue), with broadly similar distributions across intervention types (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Figure&#xa0;3</bold></xref>; <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material 2</bold></xref>, <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table&#xa0;5</bold></xref>).</p>
</sec>
<sec id="s3_3">
<title>Meta-analysis</title>
<p>Heterogeneity and risk-of-bias overview: Across primary biochemical outcomes, heterogeneity was substantial (ALT <italic>I</italic>&#xb2; &#x2248; 98%, AST <italic>I</italic>&#xb2; &#x2248; 96%, HOMA-IR <italic>I</italic>&#xb2; &#x2248; 98%, TG <italic>I</italic>&#xb2; &#x2248; 92%), whereas CAP showed low heterogeneity (<italic>I</italic>&#xb2; &#x2248; 6%) and LSM showed moderate heterogeneity (<italic>I</italic>&#xb2; &#x2248; 64%). Accordingly, we applied REML-based random-effects models and reported &#x3c4;&#xb2;, 95% prediction intervals (PI), and the <italic>p</italic>-value for heterogeneity (<italic>Q</italic> test) for all syntheses. We further explored heterogeneity via prespecified design stratification (add-on vs. mixed) and robustness diagnostics, including funnel plots, Baujat plots, leave-one-out, and top-&#x394; analyses (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Figures&#xa0;4</bold></xref>-<xref ref-type="supplementary-material" rid="SM1"><bold>S8</bold></xref>). Intervention-type stratification using the prespecified TCM category (classic/custom/patent/single) showed that the pooled effects for the 12-week biochemical endpoints (ALT/AST/TG/HOMA-IR) remained directionally favorable across classic formulas, custom formulas, and patent medicines, although substantial heterogeneity persisted within strata (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material 2</bold></xref>, <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table&#xa0;6</bold></xref>). Evidence for single-herb/extract interventions was sparse (often <italic>k</italic> = 1) and is therefore presented as exploratory; sensitivity analyses restricted to formulas (classic+custom) and excluding single-herb/extract (main) were consistent with the primary conclusions (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material 2</bold></xref>, <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table&#xa0;6</bold></xref>).</p>
<p>Risk of bias and certainty of evidence: Using RoB 2 with prespecified decision rules (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material 2</bold></xref>, <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table&#xa0;10</bold></xref>), overall risk of bias was predominantly rated as &#x201c;low&#x201d; or &#x201c;some concerns,&#x201d; with concerns most frequently arising from deviations from intended interventions (D2) and missing outcome data (D3); no studies were judged as having an overall &#x201c;high&#x201d; risk of bias (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Figure&#xa0;1</bold></xref>; domain-level judgments for each trial are provided in <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material 2</bold></xref>, <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table&#xa0;1</bold></xref>, columns BI&#x2013;BO). Certainty of evidence assessed with GRADE for the primary outcomes is summarized in the Summary of Findings table (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material 2</bold></xref>, <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table&#xa0;9</bold></xref>). Given substantial between-study heterogeneity and, for several biochemical endpoints, wide prediction intervals, certainty was commonly downgraded for inconsistency and/or imprecision, and clinical inferences were framed accordingly.</p>
<p>Add-on therapy (primary efficacy analysis; <xref ref-type="fig" rid="f8"><bold>Figure&#xa0;8</bold></xref>): Given balanced background WM regimens by design, the add-on stratum served as the primary basis for efficacy conclusions. In this framework, TCM showed directionally favorable pooled effects for liver enzymes, insulin resistance, and triglycerides. ALT decreased (<xref ref-type="fig" rid="f8"><bold>Figure&#xa0;8A</bold></xref>; MD &#x2212;8.68, 95% CI &#x2212;10.99 to &#x2212;6.37; I&#xb2;=98.1) and AST decreased (<xref ref-type="fig" rid="f8"><bold>Figure&#xa0;8B</bold></xref>; MD &#x2212;7.35, 95% CI &#x2212;9.46 to &#x2212;5.23; <italic>I</italic>&#xb2; = 95.9). HOMA-IR decreased (<xref ref-type="fig" rid="f8"><bold>Figure&#xa0;8C</bold></xref>; MD &#x2212;0.96, 95% CI &#x2212;1.39 to &#x2212;0.53; <italic>I</italic>&#xb2; = 97.5), and TG decreased (<xref ref-type="fig" rid="f8"><bold>Figure&#xa0;8D</bold></xref>; MD &#x2212;0.53, 95% CI &#x2212;0.68 to &#x2212;0.37; <italic>I</italic>&#xb2; = 92.3). However, the corresponding 95% PIs for ALT, AST, HOMA-IR, and TG crossed the null (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material S2</bold></xref>, <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Tables&#xa0;7</bold></xref>, <xref ref-type="supplementary-material" rid="SM1"><bold>S8</bold></xref>), indicating that the effect size may vary materially across settings and that a future single trial could plausibly observe attenuated or null effects despite directionally favorable pooled means. HDL-C showed a small decrease, which was unfavorable (<xref ref-type="fig" rid="f8"><bold>Figure&#xa0;8E</bold></xref>; MD &#x2212;0.13, 95% CI &#x2212;0.23 to &#x2212;0.03; <italic>I</italic>&#xb2; = 95.3).</p>
<fig id="f8" position="float">
<label>Figure&#xa0;8</label>
<caption>
<p>Random-effects meta-analysis in add-on trials. <bold>(A)</bold> ALT, <bold>(B)</bold> AST, <bold>(C)</bold> HOMA-IR, <bold>(D)</bold> TG, <bold>(E)</bold> HDL-C, <bold>(F)</bold> CAP. Effect size is mean difference (MD). Directionality (clinical improvement): MD &lt; 0 for ALT/AST/HOMA-IR/TG/CAP and MD &gt; 0 for HDL-C (HigherBetter). Squares indicate study-specific effects (size proportional to inverse-variance weight), horizontal lines show 95% CI, and diamonds denote pooled effects. <italic>&#x3c4;</italic>&#xb2;, <italic>I</italic>&#xb2;, and <italic>Q</italic>-test <italic>p</italic>-values are reported in each panel. For cross-outcome comparability, outcome-specific directionality and TE harmonization (TE &gt; 0 = improvement) are prespecified in <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table&#xa0;4</bold></xref>. Additional diagnostics (mixed set; leave-one-out/Baujat; funnel/Egger) are shown in <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Figures&#xa0;9</bold></xref>-<xref ref-type="supplementary-material" rid="SM1"><bold>S13</bold></xref>.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fendo-17-1740126-g008.tif">
<alt-text content-type="machine-generated">Forest plots showing results from multiple clinical studies comparing various interventions, with panels labeled A through F. Each panel lists intervention names, sample sizes, mean differences, and confidence intervals. Blue diamonds represent overall summary effects for endpoints: ALT (A), AST (B), HOMA-IR (C), TG (D), HDL-C (E), and CAP (F), with heterogeneity statistics beneath each plot. Each graph displays individual and pooled estimates visually along horizontal axes.</alt-text>
</graphic></fig>
<p>CAP decreased with low heterogeneity (<xref ref-type="fig" rid="f8"><bold>Figure&#xa0;8F</bold></xref>; MD &#x2212;13.72 dB/m, 95% CI &#x2212;20.09 to &#x2212;7.35; <italic>I</italic>&#xb2; = 5.5), indicating a comparatively more reproducible short-term imaging signal. Consistently, CAP showed a 95% PI that did not cross the null (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material S2</bold></xref>, <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table&#xa0;7</bold></xref>), supporting a comparatively more reproducible short-term imaging signal. LSM did not show a significant pooled change (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Figure&#xa0;4F</bold></xref>; MD &#x2212;0.63, 95% CI &#x2212;1.57 to 0.31), with moderate heterogeneity (<italic>I</italic>&#xb2; = 64.3%, <italic>&#x3c4;</italic>&#xb2;= 0.3472; <italic>p</italic> for heterogeneity = 0.0242); its 95% PI crossed the null (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material S2</bold></xref>, <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table&#xa0;7</bold></xref>), consistent with study-to-study variability and an unstable short-term stiffness signal.</p>
<p>Mixed therapy (Exploratory analysis; <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Figure&#xa0;4</bold></xref>): Results from mixed-design trials are presented as exploratory findings because background WM regimens may differ between arms or are incompletely reported. Background-therapy comparability for mixed trials was coded as balanced/unclear/imbalanced and is provided in <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material 2</bold></xref> (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table&#xa0;1</bold></xref>, column AZ: WM_comparability). Under this framework, ALT, AST, HOMA-IR, and TG showed directions consistent with the add-on analyses, but with smaller magnitudes and persistent heterogeneity; prediction intervals were generally wide and frequently crossed the null (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material S2</bold></xref>, <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table&#xa0;8</bold></xref>), reinforcing cautious interpretation.</p>
<p>Bias and robustness: Funnel plots (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Figures&#xa0;4G&#x2013;K</bold></xref>) were broadly symmetric for ALT, AST, HOMA-IR, TG; HDL-C showed asymmetry (possible small-study effects/heterogeneity). The Baujat plots (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Figures&#xa0;5</bold></xref>, <xref ref-type="supplementary-material" rid="SM1"><bold>S6</bold></xref>) indicated that few studies drove Q for ALT/AST/HOMA-IR/TG, and removing them did not change the pooled conclusions; HDL-C showed clustered high-impact points near zero; CAP contributed little and was robust; LSM was study-sensitive and overall non-significant. Leave-one-out and top-&#x394; analyses (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Figures&#xa0;7</bold></xref>, <xref ref-type="supplementary-material" rid="SM1"><bold>S8</bold></xref>) supported directionally favorable pooled effects for ALT, AST, HOMA-IR, TG, and CAP in the add-on primary set; HDL-C remained non-favorable, and the short-term LSM signal remained variable. In the mixed sets, TG showed the most reproducible pooled signal, whereas ALT/AST/HOMA-IR kept direction with attenuated size; HDL-C was uncertain; LSM was unstable.</p>
</sec>
<sec id="s3_4">
<title>Meta-regression</title>
<p>Most covariate coefficients had 95% CIs crossing zero, indicating no reproducible moderators and aligning with leave-one-out/Baujat findings. ALT, AST, HOMA-IR, TG (<xref ref-type="fig" rid="f9"><bold>Figures&#xa0;9A&#x2013;D</bold></xref>): Improvements were consistent across intervention categories, but moderator effects rarely reached significance. HDL-C (<xref ref-type="fig" rid="f9"><bold>Figure&#xa0;9E</bold></xref>): Coefficients fluctuated around zero without reproducible favorable moderation. CAP (<xref ref-type="fig" rid="f9"><bold>Figure&#xa0;9F</bold></xref>): Covariate effects were near zero, supporting CAP as the most robust short-term indicator. LSM (<xref ref-type="fig" rid="f9"><bold>Figure&#xa0;9G</bold></xref>): Directions were inconsistent with wide intervals, suggesting short-term sensitivity to study-level variation. Sample-size thresholds (add-on; one-knot piecewise on n_treat; <xref ref-type="fig" rid="f9"><bold>Figures&#xa0;9H&#x2013;L</bold></xref>). Approximate inflection points (participants per arm): ALT ~50, AST ~34, HOMA-IR ~56, TG ~40, HDL-C ~36. Effects tended to be amplified in smaller samples and stabilized/declined near these thresholds. We therefore recommend &#x2265;40&#x2013;50 participants per arm to improve reproducibility and to mitigate small-study effects.</p>
<fig id="f9" position="float">
<label>Figure&#xa0;9</label>
<caption>
<p>Meta-regression and breakpoint analysis (add-on). <bold>(A&#x2013;G)</bold> Coefficient forests (REML, Knapp&#x2013;Hartung): <italic>x</italic>-axis = regression coefficient, points = estimate, lines = 95% CI; covariates per method. Direction follows that of <xref ref-type="fig" rid="f7"><bold>Figure&#xa0;7</bold></xref> (ALT/AST/HOMA-IR/TG/CAP/LSM: coef.&lt;0 = greater improvement; HDL-C: coef.&gt;0 = greater improvement). <bold>(H&#x2013;L)</bold> Piecewise regression (1-knot) for <italic>n</italic><sub>treat</sub>: solid = adjusted mean effect; shaded = 95% CI; dashed = estimated breakpoint. Model specification and sensitivity checks are shown in <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Figure&#xa0;14</bold></xref>.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fendo-17-1740126-g009.tif">
<alt-text content-type="machine-generated">Twelve-panel scientific figure displays meta-regression coefficient plots for various biomarkers and outcome measures labeled A through G, and adjusted effect versus sample size plots with one-knot piecewise breakpoints for biomarkers labeled H through L. Each coefficient plot presents variables on the y-axis and Hedges g effect size on the x-axis with confidence intervals. Each adjusted effect plot shows sample size on the x-axis, adjusted effect on the y-axis, and a breakpoint marked by a vertical dashed line and shaded confidence intervals.</alt-text>
</graphic></fig>
<p>We further reported coefficient forest plots for the mixed set and smoothed marginal-effect curves of n_treat under add-on therapy (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Figure&#xa0;9</bold></xref>). Most coefficients fluctuated around zero with directions consistent with the main add-on regression and no stable significant moderators. The n_treat curves reproduced the &#x201c;small-sample amplification &#x2192; post-threshold stabilization/decline&#x201d; pattern; the HDL-C curve was nearly flat. After covariate adjustment, improvements in ALT/AST/HOMA-IR/TG and the stable CAP reduction remained; HDL-C showed no clear benefit, and LSM remained unstable. The sample-size thresholds provide a design benchmark (&#x2265;40&#x2013;50 per group) for future studies and interpretation.</p>
</sec>
<sec id="s3_5">
<title>Phenotype clustering and stability assessment</title>
<p>Consensus clustering (<xref ref-type="fig" rid="f10"><bold>Figures&#xa0;10A&#x2013;D</bold></xref>; <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Figure&#xa0;10</bold></xref>): Clustering was performed on symptoms, tongue&#x2013;pulse signs, and syndrome labels. The consensus CDF/&#x394;-area curves showed the largest gain at <italic>k</italic> = 2, after which gains plateaued; tracking plots indicated minimal cross-cluster migration; and the <italic>k</italic> = 2 consensus matrix presented two high-consistency diagonal blocks. Accordingly, <italic>k</italic> = 2 was selected.</p>
<fig id="f10" position="float">
<label>Figure&#xa0;10</label>
<caption>
<p>Phenotype clustering and profiling. <bold>(A)</bold> Consensus CDF, <bold>(B)</bold> &#x394;-area curves, <bold>(C)</bold> tracking plot across <italic>k</italic>, <bold>(D)</bold> consensus matrix at <italic>k</italic> = 2, <bold>(E)</bold> top 30 discriminative-feature heatmap. <italic>k</italic> = 2 yielded the largest stability gain and two high-consistency phenotypes.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fendo-17-1740126-g010.tif">
<alt-text content-type="machine-generated">Panel A shows a line graph of consensus cumulative distribution functions (CDF) for different cluster numbers, each represented by a distinct color. Panel B displays a line plot depicting the relative change in the area under the CDF curve for various cluster counts. Panel C is a tracking plot with colored vertical bars representing sample assignments across different cluster numbers. Panel D displays a consensus matrix heatmap for k equals two, indicating high agreement in cluster assignments. Panel E presents a heatmap of the top thirty discriminative phenotype features, grouped into two clusters with features labeled on the right and a color scale indicating matrix values.</alt-text>
</graphic></fig>
<p>Cluster profiles (<xref ref-type="fig" rid="f10"><bold>Figure&#xa0;10E</bold></xref>): Cluster 2&#x2014;enriched for phlegm-dampness/damp-heat with qi stagnation and spleen deficiency, characterized by greasy tongue coating, sticky/bitter taste, abdominal fullness/pain, belching, wiry/slippery pulse, red/enlarged tongue with tooth marks, poor appetite, fatigue, loose stools, obesity; cluster 1&#x2014;lighter overall symptom burden (relatively mild phenotype). The two clusters complement each other along a phlegm-dampness &#x2192; damp-heat &#x2192; qi stagnation &#x2192; spleen deficiency axis, with strong clinical interpretability.</p>
</sec>
<sec id="s3_6">
<title>Phenotype-stratified efficacy and formula prioritization</title>
<p>ALT/AST (<xref ref-type="fig" rid="f11"><bold>Figures&#xa0;11A, B</bold></xref>): In both clusters, classical formulas outperformed CPMs, with a larger advantage in cluster 1. HOMA-IR (<xref ref-type="fig" rid="f11"><bold>Figure&#xa0;11C</bold></xref>): The overall effect was small; CPMs were relatively more effective in cluster 2; no significant difference in cluster 1. TG (<xref ref-type="fig" rid="f11"><bold>Figure&#xa0;11D</bold></xref>): Clear phenotype dependence: in cluster 1, CPMs were superior; in cluster 2, classical formulas showed moderate efficacy, whereas CPMs were weaker. Top formulas (<xref ref-type="fig" rid="f11"><bold>Figures&#xa0;11E&#x2013;J</bold></xref>): The top three representatives per phenotype aligned with the mini-meta analyses, providing evidence-based prioritization of formula types by phenotype.</p>
<fig id="f11" position="float">
<label>Figure&#xa0;11</label>
<caption>
<p>Phenotype-stratified intervention matrix and representative formulas. <bold>(A&#x2013;D)</bold> Type&#xd7;phenotype&#xd7;outcome matrices (ALT, AST, HOMA-IR, TG): color = intensity of adjusted effect (Adj. TE). ALT/AST: classical formulas outperform in both phenotypes; HOMA-IR: Chinese patent medicines are superior in cluster 2; TG: prioritization varies by phenotype. <bold>(E&#x2013;H)</bold> Representative formula-level matrices (selected). <bold>(I)</bold> Top 3 per phenotype by intervention type (classical formula/Chinese patent medicine). <bold>(J)</bold> Top 3 per phenotype by formula name (with error bars). Cluster 1 = lower symptom burden; cluster 2 = higher burden with phlegm-dampness/damp-heat.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fendo-17-1740126-g011.tif">
<alt-text content-type="machine-generated">Ten-panel scientific figure displays heatmaps and bar charts. Panels A–D show four heatmaps with two rows and two columns comparing phenotype types and sex for metrics ALT, AST, HOMA-IR, and TG, using a red-yellow color scale. Panels E–H present vertical bar graphs indicating strategy matrix differences by sex and phenotype with red-yellow (and blue in G) gradients. Panels I–J display grouped bar charts listing top-3 phenotypes per type and by name for ALT, AST, HOMA-IR, and TG, with error bars and horizontal labels.</alt-text>
</graphic></fig>
</sec>
<sec id="s3_7">
<title>Predictive performance and interpretable drivers</title>
<p>Model performance (<xref ref-type="fig" rid="f2"><bold>Figures&#xa0;2A&#x2013;C</bold></xref>): Stratified machine learning on the trial&#x2013;phenotype&#x2013;intervention dataset showed modest discrimination with OOF ROC-AUC = 0.590 (<xref ref-type="fig" rid="f2"><bold>Figure&#xa0;2A</bold></xref>) and favorable precision&#x2013;recall characteristics (OOF PR-AUC = 0.903; <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table&#xa0;11</bold></xref>), with acceptable calibration (Brier = 0.112; 10-bin ECE = 0.065; <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material S2</bold></xref>, <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table&#xa0;11</bold></xref>; calibration curve in <xref ref-type="fig" rid="f2"><bold>Figure&#xa0;2C</bold></xref>). Sensitivity analyses designed to reduce study-level leakage and assess robustness were directionally consistent (LOSO-like holdout and subset checks; <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material S2</bold></xref>, <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Tables&#xa0;12</bold></xref>, <xref ref-type="supplementary-material" rid="SM1"><bold>S13</bold></xref>).</p>
<p>Global importance and marginal effects (<xref ref-type="fig" rid="f2"><bold>Figures&#xa0;2D&#x2013;K</bold></xref>). Larger n_treat/n_control, longer follow-up, smaller SE_TE, and add-on design were consistently associated with a higher probability of improvement, displaying a small-sample amplification &#x2192; mid-sample plateau pattern that aligns with weighted regression and inflection-point signals (&#x2265;40&#x2013;50 per group). SE_TE showed a monotonic negative association with improvement probability. Individual SHAP plots reproduced these trends (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Figure&#xa0;11</bold></xref>).</p>
<p>Driver consistency and response spectrum (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Figure&#xa0;12</bold></xref>). Across models and outcomes, the top 10/20 drivers were highly consistent. The &#x201c;response spectrum&#x201d; heatmap suggested a learnable coupling among phenotype, formula, and outcome&#x2014;for example, for TG, <italic>Salvia miltiorrhiza</italic>, <italic>Alisma orientale</italic>, and features related to phlegm-dampness/damp-heat/liver depression with spleen deficiency correlated positively with improvement, with a few negatively correlated items also observed (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Figures&#xa0;12J, K</bold></xref>).</p>
</sec>
</sec>
<sec id="s4" sec-type="discussion">
<title>Discussion</title>
<p>We distill heterogeneous RCT evidence into three evidence-derived, hypothesis-generating rules (summarized in <xref ref-type="fig" rid="f3"><bold>Figure&#xa0;3</bold></xref>): (A) Under TE harmonization, the pooled effects for ALT/AST, HOMA-IR, and TG are directionally favorable, but between-study variability is substantial and 95% prediction intervals for several biochemical endpoints are wide and frequently cross the null. In the add-on primary set, CAP provides a comparatively more reproducible short-term imaging signal with low heterogeneity and a PI that does not cross the null (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material 2</bold></xref>, <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table&#xa0;7</bold></xref>); (B) Design features such as &#x2265;40&#x2013;50 participants per arm and &#x2265;12&#x2013;16-week follow-up were associated with improved reproducibility/precision of estimates in the published evidence landscape; however, these patterns may reflect correlated design and reporting features (e.g., small-study effects and selective reporting) and should be treated as evidence-derived, hypothesis-generating signals rather than causal thresholds; (C) Time-window alignment matters: prioritize CAP for early windows and reserve LSM for longer follow-up. These rules together translate synthesis into trial-planning anchors and cautious, clinically interpretable guidance that warrants prospective validation. These &#x201c;rules&#x201d; summarize empirical patterns in the available evidence and are intended for trial planning and cautious interpretation rather than prescriptive clinical decision-making.</p>
<p>Most prior studies emphasized herb&#x2013;component&#x2013;target or co-occurrence patterns that are difficult to align with clinical trial evidence and TCM phenotypes (<xref ref-type="bibr" rid="B17">17</xref>&#x2013;<xref ref-type="bibr" rid="B19">19</xref>). Anchored in RCTs, our work restructures the evidence as a formula&#x2013;syndrome&#x2013;symptom&#x2013;outcome&#x2013;safety map, yielding a visual, comparable, and searchable KG. Importantly, the KG is used to organize and navigate evidence rather than to infer causality: apparent differences across interventions can largely reflect reporting architecture&#x2014;numbers of trials, add-on design, background Western medications, follow-up window, and endpoint preferences&#x2014;so we refrain from causal claims. Safety underreporting: Safety reporting is also part of this reporting architecture and was frequently incomplete: over half of the included trials did not report adverse events (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material 2</bold></xref>, <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table&#xa0;1</bold></xref>, column BH). Therefore, safety observations in this review apply only to the subset of trials with explicit AE information and should not be extrapolated as &#x201c;overall safety.&#x201d; Future RCTs should follow CONSORT harms reporting and explicitly report AE monitoring methods and results even when no events occur. To further mitigate this concern, we explicitly assessed background-therapy comparability for mixed trials and coded it as balanced/unclear/imbalanced (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material 2</bold></xref>, <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table&#xa0;1</bold></xref>, column AZ), and we interpret mixed findings accordingly as exploratory. Along the syndrome &#x2192; symptom &#x2192; formula pathway, common syndromes (e.g., liver depression and spleen deficiency; intermingled phlegm&#x2013;stasis) link to practical diagnostic clues (lassitude, poor appetite, abdominal distension, tooth-marked tongue) and then to formula categories, providing trial-traceable anchors for syndrome discrimination in practice and for protocol planning (<xref ref-type="bibr" rid="B19">19</xref>).</p>
<p>The herb&#x2013;herb network reveals a three-cluster structure built on a universal base (<italic>Pinellia</italic>&#x2013;<italic>Poria</italic>&#x2013;<italic>Citrus reticulata</italic>&#x2013;<italic>Atractylodes macrocephala</italic>&#x2013;<italic>Glycyrrhiza</italic>), with functional modules (e.g., <italic>Salvia</italic>/<italic>Bupleurum</italic>/<italic>Coptis</italic>; <italic>Scutellaria</italic>/<italic>Astragalus</italic>; <italic>Codonopsis</italic>/<italic>Crataegus</italic>) added as needed. Dosage patterns suggest that most base herbs are used at moderate doses. While these modules do not by themselves imply efficacy differences, they provide objective, pre-matchable building blocks that can support transparent reporting and enable consistent intervention specification when aligning formula design with target outcomes.</p>
<p>Consistent with earlier systematic reviews and meta-analyses reporting improvements in liver enzymes, blood lipids, and insulin resistance under TCM for MASLD&#x2014;while also noting unstable effect sizes and substantial heterogeneity (<xref ref-type="bibr" rid="B10">10</xref>, <xref ref-type="bibr" rid="B17">17</xref>, <xref ref-type="bibr" rid="B20">20</xref>, <xref ref-type="bibr" rid="B21">21</xref>) &#x2014;our unified metric (TE &gt; 0 = improvement) recovers coherent benefits in ALT, AST, HOMA-IR, and TG. Notably, the prediction intervals for these biochemical endpoints are wide and often cross the null (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Tables&#xa0;7</bold></xref>, <xref ref-type="supplementary-material" rid="SM1"><bold>S8</bold></xref>), indicating that the magnitude&#x2014;and in some settings even the presence&#x2014;of benefit may vary across future individual trials despite directionally favorable pooled means. To address concerns about clinical heterogeneity across &#x201c;TCM,&#x201d; we additionally synthesized primary endpoints within prespecified intervention strata (classic formulas, custom formulas, patent medicines, and single-herb/extracts; <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material 2</bold></xref>, <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table&#xa0;6</bold></xref>). Pooled effects were directionally favorable across major strata, but substantial residual heterogeneity persisted, and evidence for single-herb/extract interventions was sparse and therefore treated as exploratory. Several systematic reviews and meta-analyses have been published in this area. Epidemiologic SR/MAs have quantified the high burden of MASLD in patients with T2DM at the population level (<xref ref-type="bibr" rid="B7">7</xref>, <xref ref-type="bibr" rid="B19">19</xref>, <xref ref-type="bibr" rid="B22">22</xref>). In parallel, SR/MAs evaluating TCM/Chinese herbal medicine in T2DM with MASLD have generally reported improvements in liver enzymes, lipid profiles, and insulin-resistance-related indices while also emphasizing recurring evidence limitations&#x2014;heterogeneous trial designs, non-uniform background therapy, variable endpoint definitions, and imprecision driven by small samples and short follow-up (<xref ref-type="bibr" rid="B10">10</xref>, <xref ref-type="bibr" rid="B23">23</xref>). These interpretations are consistent with the GRADE Summary of Findings, in which certainty for primary outcomes was commonly downgraded due to inconsistency and/or imprecision (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material 2</bold></xref>, <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table&#xa0;9</bold></xref>).</p>
<p>Compared with these prior SR/MAs, our study differs in both scope and analytical deliverables. First, we reorganize RCT evidence into an RCT-anchored, multi-layer knowledge graph linking formula&#x2013;syndrome/symptom&#x2013;outcome&#x2013;safety, enabling navigation at the &#x201c;phenotype &#xd7; target outcome&#x201d; level rather than reporting pooled averages alone. Second, we implement unified effects (TE &gt; 0 = improvement) to harmonize effect direction across heterogeneous endpoints and pre-specify a cross-domain endpoint set (liver injury, metabolism, lipids, and imaging), thereby reducing pseudo-heterogeneity and yielding a coherent outcome fingerprint. Third, beyond conventional pooling, we evaluate how key design features (including sample size per arm and follow-up duration) relate to effect-estimate stability using weighted meta-regression and interpretable machine learning (SHAP/ALE), providing reproducibility-oriented guidance for future trial planning. To minimize study-level leakage and to frame these ML-derived signals as exploratory, models were evaluated using study-grouped fivefold OOF predictions and additional robustness checks (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material 2</bold></xref>, <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table&#xa0;11</bold></xref>-<xref ref-type="supplementary-material" rid="SM1"><bold>S13</bold></xref>). Finally, we stratified synthesis by trial design (add-on vs. mixed) to improve interpretability under non-uniform background therapy&#x2014;a limitation repeatedly noted in earlier syntheses (<xref ref-type="bibr" rid="B10">10</xref>, <xref ref-type="bibr" rid="B19">19</xref>, <xref ref-type="bibr" rid="B23">23</xref>). Primary efficacy inferences are drawn from the add-on stratum, where background WM regimens are balanced by design, whereas mixed trials are treated as exploratory/sensitivity evidence given variable or incompletely reported co-interventions (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table&#xa0;1</bold></xref>, column AZ).</p>
<p>A quantitative observation from the available evidence is that pooled signals tend to be more reproducible and/or more precise when <italic>n</italic> &#x2265; 40&#x2013;50 per arm and follow-up &#x2265;12&#x2013;16 weeks, although this pattern is exploratory and may be influenced by correlated design and reporting features. Below these thresholds, statistical uncertainty (SE) itself reduces the probability of detecting improvement, implying that much prior &#x201c;instability&#x201d; reflects low signal-to-noise rather than absent effects (<xref ref-type="bibr" rid="B17">17</xref>, <xref ref-type="bibr" rid="B18">18</xref>). Weighted meta-regression and SHAP/ALE converged on this empirical pattern, which should be interpreted as hypothesis-generating rather than causal.</p>
<p>Because add-on designs dominate and can yield &#x201c;easier&#x201d; improvements, extrapolation to single-agent use is often unclear (<xref ref-type="bibr" rid="B19">19</xref>, <xref ref-type="bibr" rid="B24">24</xref>). While add-on improves SNR and treatment consistency, it may mask marginal effects of individual agents; pooling across differing background intensities can also confound estimates. We therefore recommend prespecified design stratification and sensitivity analyses at the protocol stage as design anchors. Accordingly, we base the principal clinical interpretation on add-on trials and use mixed trials primarily to assess directional consistency under less controlled background therapy.</p>
<p>Regarding imaging endpoints, many studies used LSM as a primary short-term endpoint and reported unstable or null findings over 12&#x2013;24 weeks (<xref ref-type="bibr" rid="B25">25</xref>&#x2013;<xref ref-type="bibr" rid="B27">27</xref>). Our chain of evidence indicates that CAP is more sensitive to near-term hepatic fat change, whereas LSM is influenced by inflammation/congestion and better reflects fibrosis on a delayed time window. Prioritizing CAP and metabolic indices short-term, while reserving LSM for longer-term evaluation, may reduce false negatives caused by time-window mismatch. This interpretation is consistent with our interval evidence: CAP shows a PI that remains below the null, whereas LSM exhibits a PI crossing the null over short follow-up (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table&#xa0;7</bold></xref>), supporting a cautious interpretation of short-term stiffness changes.</p>
<p>Unlike most reviews that emphasize overall pooled average efficacy (<xref ref-type="bibr" rid="B17">17</xref>, <xref ref-type="bibr" rid="B28">28</xref>), we translate synthesis into actionable stratification via clustering and a strategy matrix: when the targets are ALT/AST and TG, classical formulas aimed at clearing turbidity/resolving dampness and regulating qi/harmonizing the middle tended to show directionally favorable pooled signals for enzyme/lipid targets in the available add-on evidence; when the target is HOMA-IR, custom formulas provide broader coverage; in phenotypes with high damp-heat burden, Chinese patent medicines are an optional strategy. These patterns are prioritization cues rather than evidence of superiority, given residual heterogeneity and wide prediction intervals. These guide target &#xd7; phenotype prioritization without asserting causality or mechanism. Notably, our main synthesis excludes single-herb/extract trials due to sparse evidence, and category-specific signals are supported by sensitivity analyses restricted to formulas only (classic + custom) and excluding single-herb/extracts, which yielded consistent overall patterns (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table&#xa0;6</bold></xref>). Accordingly, these category-linked suggestions are intended for prioritization and trial planning, not for ranking individual interventions.</p>
<p>Methodologically, to address inconsistent directional semantics, mixed units, and coarse stratification (<xref ref-type="bibr" rid="B29">29</xref>, <xref ref-type="bibr" rid="B30">30</xref>), we (i) unified directions/units with TE &gt;0 = improvement to mitigate pseudo-heterogeneity, (ii) extended beyond random-effects pooling by using weighted meta-regression to characterize sample-size/follow-up thresholds, and (iii) employed SHAP/ALE to corroborate the nonlinear pattern (&#x2191;SE &#x2192; &#x2193;improvement probability) and to integrate phenotype &#xd7; formula category &#xd7; outcome stability into a navigable matrix. The practical question thus becomes &#x201c;under which conditions and populations are improvements most likely?&#x201d;&#x2014;increasing executability. Where trial-design interpretations are involved, these prioritization cues are anchored primarily in add-on evidence and supported by mixed analyses only as exploratory context.</p>
<p>Compared with prior work (<xref ref-type="bibr" rid="B31">31</xref>, <xref ref-type="bibr" rid="B32">32</xref>), the added value is not asserting one formula &#x201c;best,&#x201d; but offering an implementable framework. Clinically, first, fix the target outcome (e.g., ALT/AST, TG, HOMA-IR) and phenotype (phlegm-dampness/damp-heat vs. liver-depression/spleen-deficiency burden) and then select formula categories. In research, consider adequately powered designs, and if feasible, aim for <italic>n</italic> &#x2265; 40&#x2013;50 per arm with &#x2265;12&#x2013;16 weeks of follow-up; use CAP/metabolic endpoints short-term and add LSM long-term; distinguish add-on intensity with prespecified stratification/sensitivity. These recommendations are evidence-anchored at the outcome level and require prospective validation rather than mechanistic extrapolation.</p>
</sec>
<sec id="s5" sec-type="conclusions">
<title>Conclusion</title>
<p>Anchored in RCT evidence, we built a formula&#x2013;syndrome/symptom&#x2013;outcome&#x2013;safety knowledge graph to support searchable, evidence-ready navigation and trial-planning prioritization. Primary inferences were based on add-on trials with balanced background Western medicine, while mixed designs were interpreted as exploratory. Under this framework, pooled effects for ALT/AST, HOMA-IR, and TG were directionally favorable after TE harmonization, but between-study variability was substantial and prediction intervals often spanned null, indicating that future individual trials could observe attenuated or null effects. CAP provided a comparatively more reproducible short-term imaging signal, whereas short-term LSM remained variable, suggesting that imaging interpretation is sensitive to follow-up window alignment. Evidence-derived design patterns (e.g., larger sample sizes and longer follow-up) and phenotype-guided signals should be regarded as hypothesis-generating rather than causal thresholds, and safety inferences are constrained by substantial harms underreporting, with reported events mainly mild gastrointestinal or systemic symptoms.</p>
</sec>
</body>
<back>
<sec id="s6" sec-type="data-availability">
<title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article/<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Material</bold></xref>. Further inquiries can be directed to the corresponding author.</p></sec>
<sec id="s7" sec-type="author-contributions">
<title>Author contributions</title>
<p>YL: Formal analysis, Methodology, Visualization, Writing &#x2013; original draft, Writing &#x2013; review &amp; editing. BW: Data curation, Formal analysis, Investigation, Methodology, Writing &#x2013; review &amp; editing. LW: Data curation, Formal analysis, Project administration, Writing &#x2013; review &amp; editing. HX: Investigation, Software, Supervision, Writing &#x2013; review &amp; editing. HZ: Data curation, Methodology, Resources, Supervision, Writing &#x2013; review &amp; editing. YC: Conceptualization, Investigation, Project administration, Visualization, Writing &#x2013; review &amp; editing.</p></sec>
<sec id="s9" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The author(s) declared that this work was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p></sec>
<sec id="s10" sec-type="ai-statement">
<title>Generative AI statement</title>
<p>The author(s) declared that generative AI was not used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p></sec>
<sec id="s11" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p></sec>
<sec id="s12" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fendo.2026.1740126/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fendo.2026.1740126/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Image1.jpeg" id="SF1" mimetype="image/jpeg"/>
<supplementary-material xlink:href="Image2.jpeg" id="SF2" mimetype="image/jpeg"/>
<supplementary-material xlink:href="Image3.jpeg" id="SF3" mimetype="image/jpeg"/>
<supplementary-material xlink:href="Image4.jpeg" id="SF4" mimetype="image/jpeg"/>
<supplementary-material xlink:href="Image5.jpeg" id="SF5" mimetype="image/jpeg"/>
<supplementary-material xlink:href="Image6.jpeg" id="SF6" mimetype="image/jpeg"/>
<supplementary-material xlink:href="Image7.jpeg" id="SF7" mimetype="image/jpeg"/>
<supplementary-material xlink:href="Image8.jpeg" id="SF8" mimetype="image/jpeg"/>
<supplementary-material xlink:href="Image9.jpeg" id="SF9" mimetype="image/jpeg"/>
<supplementary-material xlink:href="Image10.jpeg" id="SF10" mimetype="image/jpeg"/>
<supplementary-material xlink:href="Image11.jpeg" id="SF11" mimetype="image/jpeg"/>
<supplementary-material xlink:href="Image12.jpeg" id="SF12" mimetype="image/jpeg"/>
<supplementary-material xlink:href="Image13.jpeg" id="SF13" mimetype="image/jpeg"/>
<supplementary-material xlink:href="DataSheet1.pdf" id="SM1" mimetype="application/pdf"/>
<supplementary-material xlink:href="Table1.xlsx" id="SM2" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/></sec>
<ref-list>
<title>References</title>
<ref id="B1">
<label>1</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Rinella</surname> <given-names>ME</given-names></name>
<name><surname>Lazarus</surname> <given-names>JV</given-names></name>
<name><surname>Ratziu</surname> <given-names>V</given-names></name>
<name><surname>Francque</surname> <given-names>SM</given-names></name>
<name><surname>Sanyal</surname> <given-names>AJ</given-names></name>
<name><surname>Kanwal</surname> <given-names>F</given-names></name>
<etal/>
</person-group>. 
<article-title>A multisociety Delphi consensus statement on new fatty liver disease nomenclature</article-title>. <source>J Hepatol</source>. (<year>2023</year>) <volume>79</volume>:<page-range>1542&#x2013;56</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.jhep.2023.06.003</pub-id>, PMID: <pub-id pub-id-type="pmid">37364790</pub-id>
</mixed-citation>
</ref>
<ref id="B2">
<label>2</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Stefan</surname> <given-names>N</given-names></name>
<name><surname>Yki-J&#xe4;rvinen</surname> <given-names>H</given-names></name>
<name><surname>Neuschwander-Tetri</surname> <given-names>BA</given-names></name>
</person-group>. 
<article-title>Metabolic dysfunction-associated steatotic liver disease: heterogeneous pathomechanisms and effectiveness of metabolism-based treatment</article-title>. <source>Lancet Diabetes Endocrinol</source>. (<year>2024</year>) <volume>13</volume>:<page-range>134&#x2013;48</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/S2213-8587(24)00318-8</pub-id>, PMID: <pub-id pub-id-type="pmid">39681121</pub-id>
</mixed-citation>
</ref>
<ref id="B3">
<label>3</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Han</surname> <given-names>E</given-names></name>
<name><surname>Han</surname> <given-names>K-D</given-names></name>
<name><surname>Lee</surname> <given-names>Y-H</given-names></name>
<name><surname>Kim</surname> <given-names>K-S</given-names></name>
<name><surname>Hong</surname> <given-names>S</given-names></name>
<name><surname>Park</surname> <given-names>JH</given-names></name>
<etal/>
</person-group>. 
<article-title>Association of temporal MASLD with type 2 diabetes, cardiovascular disease and mortality</article-title>. <source>Cardiovasc Diabetol</source>. (<year>2025</year>) <volume>24</volume>:<fpage>289</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12933-025-02824-3</pub-id>, PMID: <pub-id pub-id-type="pmid">40665356</pub-id>
</mixed-citation>
</ref>
<ref id="B4">
<label>4</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Qi</surname> <given-names>X</given-names></name>
<name><surname>Li</surname> <given-names>J</given-names></name>
<name><surname>Caussy</surname> <given-names>C</given-names></name>
<name><surname>Teng</surname> <given-names>G-J</given-names></name>
<name><surname>Loomba</surname> <given-names>R</given-names></name>
</person-group>. 
<article-title>Epidemiology, screening, and co-management of type 2 diabetes mellitus and metabolic dysfunction-associated steatotic liver disease</article-title>. <source>Hepatology</source>. (<year>2024</year>) <volume>83</volume>:<page-range>661&#x2013;678</page-range>. doi: <pub-id pub-id-type="doi">10.1097/HEP.0000000000000913</pub-id>, PMID: <pub-id pub-id-type="pmid">38722246</pub-id>
</mixed-citation>
</ref>
<ref id="B5">
<label>5</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Vilar-Gomez</surname> <given-names>E</given-names></name>
</person-group>. 
<article-title>NAFLD and liver-related events: does type 2 diabetes have a key role</article-title>? <source>Lancet Gastroenterol Hepatol</source>. (<year>2023</year>) <volume>8</volume>:<page-range>777&#x2013;8</page-range>. doi: <pub-id pub-id-type="doi">10.1016/S2468-1253(23)00187-5</pub-id>, PMID: <pub-id pub-id-type="pmid">37419134</pub-id>
</mixed-citation>
</ref>
<ref id="B6">
<label>6</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Cusi</surname> <given-names>K</given-names></name>
<name><surname>Abdelmalek</surname> <given-names>MF</given-names></name>
<name><surname>Apovian</surname> <given-names>CM</given-names></name>
<name><surname>Balapattabi</surname> <given-names>K</given-names></name>
<name><surname>Bannuru</surname> <given-names>RR</given-names></name>
<name><surname>Barb</surname> <given-names>D</given-names></name>
<etal/>
</person-group>. 
<article-title>Metabolic dysfunction-associated steatotic liver disease (MASLD) in people with diabetes: the need for screening and early intervention. A consensus report of the American diabetes association</article-title>. <source>Diabetes Care</source>. (<year>2025</year>) <volume>48</volume>:<page-range>1057&#x2013;82</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.2337/dci24-0094</pub-id>, PMID: <pub-id pub-id-type="pmid">40434108</pub-id>
</mixed-citation>
</ref>
<ref id="B7">
<label>7</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Younossi</surname> <given-names>ZM</given-names></name>
<name><surname>Golabi</surname> <given-names>P</given-names></name>
<name><surname>de Avila</surname> <given-names>L</given-names></name>
<name><surname>Paik</surname> <given-names>JM</given-names></name>
<name><surname>Srishord</surname> <given-names>M</given-names></name>
<name><surname>Fukui</surname> <given-names>N</given-names></name>
<etal/>
</person-group>. 
<article-title>The global epidemiology of NAFLD and NASH in patients with type 2 diabetes: A systematic review and meta-analysis</article-title>. <source>J Hepatol</source>. (<year>2019</year>) <volume>71</volume>:<fpage>793</fpage>&#x2013;<lpage>801</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.jhep.2019.06.021</pub-id>, PMID: <pub-id pub-id-type="pmid">31279902</pub-id>
</mixed-citation>
</ref>
<ref id="B8">
<label>8</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Castera</surname> <given-names>L</given-names></name>
<name><surname>Garteiser</surname> <given-names>P</given-names></name>
<name><surname>Laouenan</surname> <given-names>C</given-names></name>
<name><surname>Vidal-Tr&#xe9;can</surname> <given-names>T</given-names></name>
<name><surname>Vallet-Pichard</surname> <given-names>A</given-names></name>
<name><surname>Manchon</surname> <given-names>P</given-names></name>
<etal/>
</person-group>. 
<article-title>Prospective head-to-head comparison of non-invasive scores for diagnosis of fibrotic MASH in patients with type 2 diabetes</article-title>. <source>J Hepatol</source>. (<year>2024</year>) <volume>81</volume>:<fpage>195</fpage>&#x2013;<lpage>206</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.jhep.2024.03.023</pub-id>, PMID: <pub-id pub-id-type="pmid">38548067</pub-id>
</mixed-citation>
</ref>
<ref id="B9">
<label>9</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Jurek</surname> <given-names>JM</given-names></name>
<name><surname>Zablocka-Sowinska</surname> <given-names>K</given-names></name>
<name><surname>Clavero Mestres</surname> <given-names>H</given-names></name>
<name><surname>Reyes Guti&#xe9;rrez</surname> <given-names>L</given-names></name>
<name><surname>Camaron</surname> <given-names>J</given-names></name>
<name><surname>Auguet</surname> <given-names>T</given-names></name>
</person-group>. 
<article-title>The impact of dietary interventions on metabolic outcomes in metabolic dysfunction-associated steatotic liver disease (MASLD) and comorbid conditions, including obesity and type 2 diabetes</article-title>. <source>Nutrients</source>. (<year>2025</year>) <volume>17</volume>:<fpage>1257</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/nu17071257</pub-id>, PMID: <pub-id pub-id-type="pmid">40219014</pub-id>
</mixed-citation>
</ref>
<ref id="B10">
<label>10</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Cao</surname> <given-names>J</given-names></name>
<name><surname>Bao</surname> <given-names>T</given-names></name>
<name><surname>Cao</surname> <given-names>J</given-names></name>
<name><surname>Fan</surname> <given-names>X</given-names></name>
<name><surname>Wang</surname> <given-names>Y</given-names></name>
<name><surname>Yu</surname> <given-names>J</given-names></name>
<etal/>
</person-group>. 
<article-title>Metabolic dysfunction-associated fatty liver in type 2 diabetes mellitus patient: can a systematic review of and meta-analysis of commonly used TCM-preparation shed light on their efficacy</article-title>? <source>Front Pharmacol</source>. (<year>2025</year>) <volume>16</volume>:<elocation-id>1578371</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fphar.2025.1578371</pub-id>, PMID: <pub-id pub-id-type="pmid">40894218</pub-id>
</mixed-citation>
</ref>
<ref id="B11">
<label>11</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Chi</surname> <given-names>L</given-names></name>
<name><surname>Niu</surname> <given-names>H</given-names></name>
<name><surname>Niu</surname> <given-names>Y</given-names></name>
<name><surname>Yao</surname> <given-names>R</given-names></name>
<name><surname>Shi</surname> <given-names>D</given-names></name>
<name><surname>Lu</surname> <given-names>B</given-names></name>
<etal/>
</person-group>. 
<article-title>Trigonella foenum-graecum L. ameliorates metabolism-associated fatty liver disease in type 2 diabetic mice: a multi-omics mechanism analysis</article-title>. <source>J Ethnopharmacol</source>. (<year>2025</year>) <volume>348</volume>:<fpage>119862</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.jep.2025.119862</pub-id>, PMID: <pub-id pub-id-type="pmid">40274034</pub-id>
</mixed-citation>
</ref>
<ref id="B12">
<label>12</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Niu</surname> <given-names>S</given-names></name>
<name><surname>Chen</surname> <given-names>S</given-names></name>
<name><surname>Wu</surname> <given-names>D</given-names></name>
<name><surname>Wang</surname> <given-names>C</given-names></name>
<name><surname>Xu</surname> <given-names>J</given-names></name>
<name><surname>Yin</surname> <given-names>J</given-names></name>
<etal/>
</person-group>. 
<article-title>Multi-omics analysis of hepatic outcomes in T2DM-MAFLD patients treated with semaglutide: a single-centre, longitudinal, data-driven study</article-title>. <source>Front Endocrinol (Lausanne)</source>. (<year>2025</year>) <volume>16</volume>:<elocation-id>1650729</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fendo.2025.1650729</pub-id>, PMID: <pub-id pub-id-type="pmid">41103643</pub-id>
</mixed-citation>
</ref>
<ref id="B13">
<label>13</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Bhardwaj</surname> <given-names>M</given-names></name>
<name><surname>Mazumder</surname> <given-names>PM</given-names></name>
</person-group>. 
<article-title>The gut-liver axis: emerging mechanisms and therapeutic approaches for nonalcoholic fatty liver disease and type 2 diabetes mellitus</article-title>. <source>Naunyn Schmiedebergs Arch Pharmacol</source>. (<year>2024</year>) <volume>397</volume>:<page-range>8421&#x2013;43</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s00210-024-03204-6</pub-id>, PMID: <pub-id pub-id-type="pmid">38861011</pub-id>
</mixed-citation>
</ref>
<ref id="B14">
<label>14</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Tian</surname> <given-names>S</given-names></name>
<name><surname>Miao</surname> <given-names>M</given-names></name>
<name><surname>Xiong</surname> <given-names>W</given-names></name>
<name><surname>Xiong</surname> <given-names>W</given-names></name>
<name><surname>Bai</surname> <given-names>M</given-names></name>
<name><surname>Li</surname> <given-names>L</given-names></name>
</person-group>. 
<article-title>Analysis on external application functions and applications of medicinal materials and decoction pieces in Chinese pharmacopoeia (Volume I) 2020 edition</article-title>. <source>Chin J Exp Traditional Med Formulae</source>. (<year>2021</year>) <volume>27</volume>:<page-range>161&#x2013;7</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.13422/j.cnki.syfjx.20202446</pub-id>
</mixed-citation>
</ref>
<ref id="B15">
<label>15</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author"><collab>National Standard of the People's Republic of China</collab>
</person-group>. 
<article-title>Clinical terminology of traditional Chinese medicine - part 1: diseases</article-title>. (<year>2023</year>). GB/T 16751.1-2023.
</mixed-citation>
</ref>
<ref id="B16">
<label>16</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author"><collab>National Standard of the People's Republic of China</collab>
</person-group>. 
<article-title>Clinical terminology of traditional Chinese medicine - part 2: syndromes</article-title>. (<year>2021</year>). GB/T 16751.2-2021.
</mixed-citation>
</ref>
<ref id="B17">
<label>17</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Shi</surname> <given-names>R</given-names></name>
<name><surname>Chai</surname> <given-names>K</given-names></name>
<name><surname>Wang</surname> <given-names>H</given-names></name>
<name><surname>Guo</surname> <given-names>S</given-names></name>
<name><surname>Zhai</surname> <given-names>Y</given-names></name>
<name><surname>Huang</surname> <given-names>J</given-names></name>
<etal/>
</person-group>. 
<article-title>Comparative effectiveness of five Chinese patent medicines for non-alcoholic fatty liver disease: A systematic review and Bayesian network meta-analysis</article-title>. <source>Phytomedicine</source>. (<year>2024</year>) <volume>135</volume>:<fpage>156124</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.phymed.2024.156124</pub-id>, PMID: <pub-id pub-id-type="pmid">39388923</pub-id>
</mixed-citation>
</ref>
<ref id="B18">
<label>18</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Zhang</surname> <given-names>Y</given-names></name>
<name><surname>Liu</surname> <given-names>T</given-names></name>
<name><surname>Zhang</surname> <given-names>L</given-names></name>
<name><surname>Pu</surname> <given-names>Z</given-names></name>
<name><surname>Yan</surname> <given-names>Z</given-names></name>
<name><surname>Hua</surname> <given-names>H</given-names></name>
</person-group>. 
<article-title>Wendan decoction in the treatment of nonalcoholic fatty liver disease: A systematic review and meta-analysis</article-title>. <source>Front Pharmacol</source>. (<year>2022</year>) <volume>13</volume>:<elocation-id>1039611</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fphar.2022.1039611</pub-id>, PMID: <pub-id pub-id-type="pmid">36324682</pub-id>
</mixed-citation>
</ref>
<ref id="B19">
<label>19</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Peng</surname> <given-names>S</given-names></name>
<name><surname>Liu</surname> <given-names>L</given-names></name>
<name><surname>Xie</surname> <given-names>Z</given-names></name>
<name><surname>Zhang</surname> <given-names>X</given-names></name>
<name><surname>Xie</surname> <given-names>C</given-names></name>
<name><surname>Ye</surname> <given-names>S</given-names></name>
<etal/>
</person-group>. 
<article-title>Chinese herbal medicine for type 2 diabetes mellitus with nonalcoholic fatty liver disease: A systematic review and meta-analysis</article-title>. <source>Front Pharmacol</source>. (<year>2022</year>) <volume>13</volume>:<elocation-id>863839</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fphar.2022.863839</pub-id>, PMID: <pub-id pub-id-type="pmid">35833030</pub-id>
</mixed-citation>
</ref>
<ref id="B20">
<label>20</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Li</surname> <given-names>X</given-names></name>
<name><surname>He</surname> <given-names>J</given-names></name>
<name><surname>Sun</surname> <given-names>Q</given-names></name>
</person-group>. 
<article-title>The prevalence and effects of sarcopenia in patients with metabolic dysfunction-associated steatotic liver disease (MASLD): A systematic review and meta-analysis</article-title>. <source>Clin Nutr</source>. (<year>2024</year>) <volume>43</volume>:<page-range>2005&#x2013;16</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.clnu.2024.07.006</pub-id>, PMID: <pub-id pub-id-type="pmid">39053329</pub-id>
</mixed-citation>
</ref>
<ref id="B21">
<label>21</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Huang</surname> <given-names>Q</given-names></name>
<name><surname>An</surname> <given-names>Z</given-names></name>
<name><surname>Xin</surname> <given-names>X</given-names></name>
<name><surname>Gou</surname> <given-names>X</given-names></name>
<name><surname>Tian</surname> <given-names>X</given-names></name>
<name><surname>Hu</surname> <given-names>Y</given-names></name>
<etal/>
</person-group>. 
<article-title>The effectiveness of curcumin, resveratrol, and silymarin on MASLD: A systematic review and meta-analysis</article-title>. <source>Food Sci Nutr</source>. (<year>2024</year>) <volume>12</volume>:<page-range>10010&#x2013;29</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/fsn3.4595</pub-id>, PMID: <pub-id pub-id-type="pmid">39723101</pub-id>
</mixed-citation>
</ref>
<ref id="B22">
<label>22</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>En Li Cho</surname> <given-names>E</given-names></name>
<name><surname>Ang</surname> <given-names>CZ</given-names></name>
<name><surname>Quek</surname> <given-names>J</given-names></name>
<name><surname>Fu</surname> <given-names>CE</given-names></name>
<name><surname>Lim</surname> <given-names>LKE</given-names></name>
<name><surname>Heng</surname> <given-names>ZEQ</given-names></name>
<etal/>
</person-group>. 
<article-title>Global prevalence of non-alcoholic fatty liver disease in type 2 diabetes mellitus: an updated systematic review and meta-analysis</article-title>. <source>Gut</source>. (<year>2023</year>) <volume>72</volume>:<page-range>2138&#x2013;48</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1136/gutjnl-2023-330110</pub-id>, PMID: <pub-id pub-id-type="pmid">37491159</pub-id>
</mixed-citation>
</ref>
<ref id="B23">
<label>23</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Liang</surname> <given-names>Z</given-names></name>
<name><surname>Chen</surname> <given-names>X</given-names></name>
<name><surname>Shi</surname> <given-names>J</given-names></name>
<name><surname>Hu</surname> <given-names>H</given-names></name>
<name><surname>Xue</surname> <given-names>Y</given-names></name>
<name><surname>Ung</surname> <given-names>COL</given-names></name>
</person-group>. 
<article-title>Efficacy and safety of traditional Chinese medicines for non-alcoholic fatty liver disease: a systematic literature review of randomized controlled trials</article-title>. <source>Chin Med</source>. (<year>2021</year>) <volume>16</volume>:<fpage>9</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s13020-020-00422-x</pub-id>, PMID: <pub-id pub-id-type="pmid">33430929</pub-id>
</mixed-citation>
</ref>
<ref id="B24">
<label>24</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Nie</surname> <given-names>Q</given-names></name>
<name><surname>Li</surname> <given-names>M</given-names></name>
<name><surname>Huang</surname> <given-names>C</given-names></name>
<name><surname>Yuan</surname> <given-names>Y</given-names></name>
<name><surname>Liang</surname> <given-names>Q</given-names></name>
<name><surname>Ma</surname> <given-names>X</given-names></name>
<etal/>
</person-group>. 
<article-title>The clinical efficacy and safety of berberine in the treatment of non-alcoholic fatty liver disease: a meta-analysis and systematic review</article-title>. <source>J Transl Med</source>. (<year>2024</year>) <volume>22</volume>:<fpage>225</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12967-024-05011-2</pub-id>, PMID: <pub-id pub-id-type="pmid">38429794</pub-id>
</mixed-citation>
</ref>
<ref id="B25">
<label>25</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>M&#xf3;zes</surname> <given-names>FE</given-names></name>
<name><surname>Lee</surname> <given-names>JA</given-names></name>
<name><surname>Selvaraj</surname> <given-names>EA</given-names></name>
<name><surname>Jayaswal</surname> <given-names>ANA</given-names></name>
<name><surname>Trauner</surname> <given-names>M</given-names></name>
<name><surname>Boursier</surname> <given-names>J</given-names></name>
<etal/>
</person-group>. 
<article-title>Diagnostic accuracy of non-invasive tests for advanced fibrosis in patients with NAFLD: an individual patient data meta-analysis</article-title>. <source>Gut</source>. (<year>2021</year>) <volume>71</volume>:<page-range>1006&#x2013;19</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1136/gutjnl-2021-324243</pub-id>, PMID: <pub-id pub-id-type="pmid">34001645</pub-id>
</mixed-citation>
</ref>
<ref id="B26">
<label>26</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Selvaraj</surname> <given-names>EA</given-names></name>
<name><surname>M&#xf3;zes</surname> <given-names>FE</given-names></name>
<name><surname>Jayaswal</surname> <given-names>ANA</given-names></name>
<name><surname>Zafarmand</surname> <given-names>MH</given-names></name>
<name><surname>Vali</surname> <given-names>Y</given-names></name>
<name><surname>Lee</surname> <given-names>JA</given-names></name>
<etal/>
</person-group>. 
<article-title>Diagnostic accuracy of elastography and magnetic resonance imaging in patients with NAFLD: A systematic review and meta-analysis</article-title>. <source>J Hepatol</source>. (<year>2021</year>) <volume>75</volume>:<page-range>770&#x2013;85</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.jhep.2021.04.044</pub-id>, PMID: <pub-id pub-id-type="pmid">33991635</pub-id>
</mixed-citation>
</ref>
<ref id="B27">
<label>27</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Pennisi</surname> <given-names>G</given-names></name>
<name><surname>Enea</surname> <given-names>M</given-names></name>
<name><surname>Falco</surname> <given-names>V</given-names></name>
<name><surname>Aithal</surname> <given-names>GP</given-names></name>
<name><surname>Palaniyappan</surname> <given-names>N</given-names></name>
<name><surname>Yilmaz</surname> <given-names>Y</given-names></name>
<etal/>
</person-group>. 
<article-title>Noninvasive assessment of liver disease severity in patients with nonalcoholic fatty liver disease (NAFLD) and type 2 diabetes</article-title>. <source>Hepatology</source>. (<year>2023</year>) <volume>78</volume>:<fpage>195</fpage>&#x2013;<lpage>211</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1097/HEP.0000000000000351</pub-id>, PMID: <pub-id pub-id-type="pmid">36924031</pub-id>
</mixed-citation>
</ref>
<ref id="B28">
<label>28</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Deng</surname> <given-names>M</given-names></name>
<name><surname>Wen</surname> <given-names>Y</given-names></name>
<name><surname>Yan</surname> <given-names>J</given-names></name>
<name><surname>Fan</surname> <given-names>Y</given-names></name>
<name><surname>Wang</surname> <given-names>Z</given-names></name>
<name><surname>Zhang</surname> <given-names>R</given-names></name>
<etal/>
</person-group>. 
<article-title>Comparative effectiveness of multiple different treatment regimens for nonalcoholic fatty liver disease with type 2 diabetes mellitus: a systematic review and Bayesian network meta-analysis of randomised controlled trials</article-title>. <source>BMC Med</source>. (<year>2023</year>) <volume>21</volume>:<fpage>447</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12916-023-03129-6</pub-id>, PMID: <pub-id pub-id-type="pmid">37974258</pub-id>
</mixed-citation>
</ref>
<ref id="B29">
<label>29</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Shi</surname> <given-names>R</given-names></name>
<name><surname>Chai</surname> <given-names>K</given-names></name>
<name><surname>Wang</surname> <given-names>H</given-names></name>
<name><surname>Zhou</surname> <given-names>J</given-names></name>
<name><surname>Yang</surname> <given-names>S</given-names></name>
<name><surname>Li</surname> <given-names>J</given-names></name>
<etal/>
</person-group>. 
<article-title>Clinical assessment of common medications for nonalcoholic fatty liver disease: A systematic review and Bayesian network meta-analysis</article-title>. <source>J Evid Based Med</source>. (<year>2025</year>) <volume>18</volume>:<elocation-id>e70002</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/jebm.70002</pub-id>, PMID: <pub-id pub-id-type="pmid">39963857</pub-id>
</mixed-citation>
</ref>
<ref id="B30">
<label>30</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Ebrahimzadeh</surname> <given-names>A</given-names></name>
<name><surname>Mohseni</surname> <given-names>S</given-names></name>
<name><surname>Safargar</surname> <given-names>M</given-names></name>
<name><surname>Mohtashamian</surname> <given-names>A</given-names></name>
<name><surname>Niknam</surname> <given-names>S</given-names></name>
<name><surname>Bakhoda</surname> <given-names>M</given-names></name>
<etal/>
</person-group>. 
<article-title>Curcumin effects on glycaemic indices, lipid profile, blood pressure, inflammatory markers and anthropometric measurements of non-alcoholic fatty liver disease patients: A systematic review and meta-analysis of randomized clinical trials</article-title>. <source>Complement Ther Med</source>. (<year>2024</year>) <volume>80</volume>:<fpage>103025</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.ctim.2024.103025</pub-id>, PMID: <pub-id pub-id-type="pmid">38232906</pub-id>
</mixed-citation>
</ref>
<ref id="B31">
<label>31</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Liu</surname> <given-names>N</given-names></name>
<name><surname>Yang</surname> <given-names>J</given-names></name>
<name><surname>Ma</surname> <given-names>W</given-names></name>
<name><surname>Li</surname> <given-names>C</given-names></name>
<name><surname>An</surname> <given-names>L</given-names></name>
<name><surname>Zhang</surname> <given-names>X</given-names></name>
<etal/>
</person-group>. 
<article-title>Xiaoyao Powder in the treatment of non-alcoholic fatty liver disease: A systematic review and meta-analysis</article-title>. <source>J Ethnopharmacol</source>. (<year>2022</year>) <volume>288</volume>:<fpage>114999</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.jep.2022.114999</pub-id>, PMID: <pub-id pub-id-type="pmid">35051605</pub-id>
</mixed-citation>
</ref>
<ref id="B32">
<label>32</label>
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Mou</surname> <given-names>Z</given-names></name>
<name><surname>Gong</surname> <given-names>T</given-names></name>
<name><surname>Wu</surname> <given-names>Y</given-names></name>
<name><surname>Liu</surname> <given-names>J</given-names></name>
<name><surname>Yu</surname> <given-names>J</given-names></name>
<name><surname>Mao</surname> <given-names>L</given-names></name>
</person-group>. 
<article-title>The efficacy and safety of Dachaihu decoction in the treatment of nonalcoholic fatty liver disease: a systematic review and meta-analysis</article-title>. <source>Front Med (Lausanne)</source>. (<year>2024</year>) <volume>11</volume>:<elocation-id>1397900</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fmed.2024.1397900</pub-id>, PMID: <pub-id pub-id-type="pmid">39015790</pub-id>
</mixed-citation>
</ref>
</ref-list>
<fn-group>
<fn id="n1" fn-type="custom" custom-type="edited-by">
<p>Edited by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1014088">Yongsheng Chen</ext-link>, Jinan University, China</p></fn>
<fn id="n2" fn-type="custom" custom-type="reviewed-by">
<p>Reviewed by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/962042">Boxun Zhang</ext-link>, China Academy of Chinese Medical Sciences, China</p>
<p><ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2091785">Dachuan Jin</ext-link>, The Affiliated Infectious Disease Hospital of Zhengzhou University, China</p></fn>
</fn-group>
</back>
</article>