<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Cell Dev. Biol.</journal-id>
<journal-title>Frontiers in Cell and Developmental Biology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Cell Dev. Biol.</abbrev-journal-title>
<issn pub-type="epub">2296-634X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">1089915</article-id>
<article-id pub-id-type="doi">10.3389/fcell.2022.1089915</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Cell and Developmental Biology</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Integrated analysis of WGCNA and machine learning identified diagnostic biomarkers in dilated cardiomyopathy with heart failure</article-title>
<alt-title alt-title-type="left-running-head">Zhu et al.</alt-title>
<alt-title alt-title-type="right-running-head">
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3389/fcell.2022.1089915">10.3389/fcell.2022.1089915</ext-link>
</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Zhu</surname>
<given-names>Yihao</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="fn" rid="fn1">
<sup>&#x2020;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1231544/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Yang</surname>
<given-names>Xiaojing</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="fn" rid="fn1">
<sup>&#x2020;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2093598/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Zu</surname>
<given-names>Yao</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1110992/overview"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>International Research Center for Marine Biosciences</institution>, <institution>Ministry of Science and Technology</institution>, <institution>Shanghai Ocean University</institution>, <addr-line>Shanghai</addr-line>, <country>China</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Key Laboratory of Exploration and Utilization of Aquatic Genetic Resources</institution>, <institution>Ministry of Education</institution>, <institution>Shanghai Ocean University</institution>, <addr-line>Shanghai</addr-line>, <country>China</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Marine Biomedical Science and Technology Innovation Platform of Lin-gang Special Area</institution>, <addr-line>Shanghai</addr-line>, <country>China</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1607196/overview">Wei Dai</ext-link>, Fudan University, China</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2092642/overview">Wei Qin</ext-link>, Oklahoma Medical Research Foundation, United States</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2099090/overview">Chengjian Zhao</ext-link>, Sichuan University, China</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Yao Zu, <email>yzu@shou.edu.cn</email>
</corresp>
<fn fn-type="other">
<p>This article was submitted to Molecular and Cellular Pathology, a section of the journal Frontiers in Cell and Developmental Biology</p>
</fn>
<fn fn-type="equal" id="fn1">
<label>
<sup>&#x2020;</sup>
</label>
<p>These authors have contributed equally to this work and share first authorship</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>05</day>
<month>12</month>
<year>2022</year>
</pub-date>
<pub-date pub-type="collection">
<year>2022</year>
</pub-date>
<volume>10</volume>
<elocation-id>1089915</elocation-id>
<history>
<date date-type="received">
<day>04</day>
<month>11</month>
<year>2022</year>
</date>
<date date-type="accepted">
<day>23</day>
<month>11</month>
<year>2022</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2022 Zhu, Yang and Zu.</copyright-statement>
<copyright-year>2022</copyright-year>
<copyright-holder>Zhu, Yang and Zu</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>The etiologies and pathogenesis of dilated cardiomyopathy (DCM) with heart failure (HF) remain to be defined. Thus, exploring specific diagnosis biomarkers and mechanisms is urgently needed to improve this situation. In this study, three gene expression profiling datasets (GSE29819, GSE21610, GSE17800) and one single-cell RNA sequencing dataset (GSE95140) were obtained from the Gene Expression Omnibus (GEO) database. GSE29819 and GSE21610 were combined into the training group, while GSE17800 was the test group. We used the weighted gene co-expression network analysis (WGCNA) and identified fifteen driver genes highly associated with DCM with HF in the module. We performed the least absolute shrinkage and selection operator (LASSO) on the driver genes and then constructed five machine learning classifiers (random forest, gradient boosting machine, neural network, eXtreme gradient boosting, and support vector machine). Random forest was the best-performing classifier established on five Lasso-selected genes, which was utilized to select out NPPA, OMD, and PRELP for diagnosing DCM with HF. Moreover, we observed the up-regulation mRNA levels and robust diagnostic accuracies of NPPA, OMD, and PRELP in the training group and test group. Single-cell RNA-seq analysis further demonstrated their stable up-regulation expression patterns in various cardiomyocytes of DCM patients. Besides, through gene set enrichment analysis (GSEA), we found TGF-&#x3b2; signaling pathway, correlated with NPPA, OMD, and PRELP, was the underlying mechanism of DCM with HF. Overall, our study revealed NPPA, OMD, and PRELP serving as diagnostic biomarkers for DCM with HF, deepening the understanding of its pathogenesis.</p>
</abstract>
<kwd-group>
<kwd>dilated cardiomyopathy</kwd>
<kwd>heart failure</kwd>
<kwd>diagnostic biomarker</kwd>
<kwd>weighted gene coexpression network analysis</kwd>
<kwd>machine learning</kwd>
</kwd-group>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="s1">
<title>Introduction</title>
<p>As the most common primary cardiomyopathy, dilated cardiomyopathy (DCM), is characterized by left ventricular dilation along with systolic dysfunction (<xref ref-type="bibr" rid="B48">Weintraub et al., 2017</xref>). The clinical manifestation of DCM ranges from none to overt symptoms of heart failure (HF) (<xref ref-type="bibr" rid="B30">McNally and Mestroni, 2017</xref>). Accordingly, there is no specific clinical manifestation for the diagnosis of DCM. Most patients with DCM usually have a progressively worsening condition, leading to advanced HF and ultimate death (<xref ref-type="bibr" rid="B27">Mahmaljy et al., 2022</xref>; <xref ref-type="bibr" rid="B53">Zheng et al., 2022</xref>). DCM is an essential cause of HF, and advanced HF in DCM is a leading indication for heart transplantation (<xref ref-type="bibr" rid="B41">Seferovi&#x107; et al., 2019</xref>). The estimated prevalence of DCM is 1 case per 250 individuals (<xref ref-type="bibr" rid="B41">Seferovi&#x107; et al., 2019</xref>). Notably, the reported incidence of DCM in patients with HF varied greatly (8%&#x2013;47%) due to the precise diagnosis lacking (<xref ref-type="bibr" rid="B41">Seferovi&#x107; et al., 2019</xref>). There are many etiologies of DCM, most of which are idiopathic (<xref ref-type="bibr" rid="B30">McNally and Mestroni, 2017</xref>; <xref ref-type="bibr" rid="B27">Mahmaljy et al., 2022</xref>; <xref ref-type="bibr" rid="B29">McDonagh et al., 2022</xref>). Etiologies of HF in DCM mainly include inherited (pathogenic gene mutations) and various acquired causes (infectious or toxic agents, auto-immunity, endocrine or metabolic abnormalities) (<xref ref-type="bibr" rid="B41">Seferovi&#x107; et al., 2019</xref>; <xref ref-type="bibr" rid="B29">McDonagh et al., 2022</xref>). To date, mutations in genes coding for cytoskeletal, contractile proteins, nuclear membrane, ion channels, and intercellular junction molecules has been proven to be associated with DCM (<xref ref-type="bibr" rid="B19">Japp et al., 2016</xref>; <xref ref-type="bibr" rid="B41">Seferovi&#x107; et al., 2019</xref>). Among these genetic variants in DCM, inherited mutations of TTN, LMNA, MYH7, MYH6, TNNT2, and ACTC1 are the leading causes (<xref ref-type="bibr" rid="B11">Fatkin et al., 1999</xref>; <xref ref-type="bibr" rid="B42">Seidman and Seidman, 2001</xref>; <xref ref-type="bibr" rid="B14">Gerull et al., 2002</xref>; <xref ref-type="bibr" rid="B7">Carniel et al., 2005</xref>; <xref ref-type="bibr" rid="B28">Mazzarotto et al., 2020</xref>). During recent decades, continuously improving diagnosis and treatment strategies (including early diagnosis development, advanced pharmacological treatments, and device therapies) have greatly improved the prognosis and survival of DCM patients (<xref ref-type="bibr" rid="B31">Merlo et al., 2014</xref>). However, the etiologies and pathogenesis of DCM with HF have not been fully understood, resulting in non-specific treatment. Heart transplantation remains the only viable approach for treating DCM with advanced HF (<xref ref-type="bibr" rid="B18">Iwata et al., 2020</xref>). Therefore, novel mechanisms needed to be elucidated to improve this situation. Besides, developing a precise diagnosis approach for DCM with HF is equally significant.</p>
<p>In this study, we conducted a series of bioinformatics analyses and machine learning classifiers to identify the underlying genes as diagnostic biomarkers for DCM with HF patients, which might provide insight into diagnosis and treatment for DCM with HF. The overall study design was shown in <xref ref-type="sec" rid="s11">Supplementary Figure S1</xref>. First, three gene expression profiling datasets of DCM with HF (GSE29819, GSE21610, GSE17800) were downloaded from the GEO database. GSE29819 and GSE21610 were merged into the training group, while GSE17800 was the test group for validation. Second, we performed Principal Component Analysis (PCA) on the training group to evaluate data dispersion and then screened out the differential expression genes (DEGs) between the control and DCM with HF patients. Third, we explored the potential biological functions, signaling pathways, and correlated diseases of the up-regulated DEGs. Fourth, the gene co-expression network was constructed, and driver genes of identified module closely associated with DCM with HF were extracted. Next, we identified the intersection of the driver genes and up-regulated genes as the feature genes for DCM with HF. Fifth, within the training and test groups, Back Propagation Neural Network (BPNN) established on these feature genes was utilized to classify the normal and DCM with HF patients (<xref ref-type="bibr" rid="B36">Ruan et al., 2021</xref>). We assessed the classified accuracy of BPNN with the Area Under Curve (AUC) score of the Receiver Operating Characteristic (ROC) curve. Sixth, the least absolute shrinkage and selection operator (Lasso) was first conducted to narrow down the feature gene sets and five well-established classifiers (Random Forest, Gradient Boosting Machine, Neural Network, eXtreme Gradient Boosting, Support Vector Machine) (<xref ref-type="bibr" rid="B17">Han et al., 2014</xref>; <xref ref-type="bibr" rid="B43">Sheridan et al., 2016</xref>; <xref ref-type="bibr" rid="B34">Olson et al., 2018</xref>; <xref ref-type="bibr" rid="B50">Yang et al., 2020</xref>; <xref ref-type="bibr" rid="B36">Ruan et al., 2021</xref>) on the Lasso-selected features were applied. In the training group and test group, the classifier performed with the minimum residual and maximum AUC score was considered the most robust for selecting the critical features (key genes) as biomarkers for diagnosing DCM with HF (<xref ref-type="bibr" rid="B35">Pan et al., 2021</xref>). Seventh, we analyzed the mRNA expression levels and diagnosis abilities of key genes in the training group and test group. Moreover, we carried out single-cell RNA-sequencing analysis on GSE95140, thus demonstrating the expression distributions and dynamic changes of key genes in damaged cardiomyocytes of DCM patients. We then investigated and inferred the potential pathways of key genes by integrating the Gene Set Enrichment Analysis (GSEA) with Pearson&#x2019;s correlation analysis. Overall, our research identified promising diagnostic biomarkers from integrating WGCNA and machine learning and might be a fresh perspective to understand the development of DCM with HF.</p>
</sec>
<sec sec-type="materials|methods" id="s2">
<title>Materials and methods</title>
<sec id="s2-1">
<title>Data collection and processing</title>
<p>Three gene expression profiles of DCM with HF (GSE29819, GSE21610, GSE17800) and one single-cell RNA-sequencing dataset of DCM (GSE95140) were downloaded from the GEO database (<ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/geo/">https://www.ncbi.nlm.nih.gov/geo/</ext-link>). First, GSE29819 and GSE21610 were merged into the training group for major analysis, containing 20 normal myocardial tissues and 35 myocardial tissues derived from DCM patients with HF (<xref ref-type="bibr" rid="B39">Schwientek et al., 2010</xref>; <xref ref-type="bibr" rid="B13">Gaertner et al., 2012</xref>). GSE17800 was the test group for validation, including nine normal myocardial tissues and 40 myocardial tissues from DCM patients with HF (<xref ref-type="bibr" rid="B3">Ameling et al., 2013</xref>). GSE29819, GSE21610, and GSE17800 were based on the GPL570 sequencing platform. And a total of 21,628 genes and 21,654 genes were obtained in the training group and test group, respectively. The probes were annotated to official gene symbols using the Perl programming. Next, we performed log2 transformation and then normalized the raw count expression data using the function &#x201c;normalizeBetweenArrays&#x201d; of the R package &#x201c;limma&#x201d;. For the training group, the function &#x201c;ComBat&#x201d; of the R package &#x201c;sva&#x201d; was then utilized to remove the batch effect of GSE29819 and GSE21610. Moreover, heart specimens from normal individuals and 10 DCM patients were obtained from GSE95140 for further verification and single-cell RNA-seq analysis (<xref ref-type="bibr" rid="B33">Nomura et al., 2018</xref>). The sequencing platform of GSE95140 was GPL16791.</p>
</sec>
<sec id="s2-2">
<title>Principal component analysis and identification of DEGs</title>
<p>To assess the dispersion between the control group and DCM with HF group, PCA was performed and two components were extracted. Then, the R package &#x201c;limma&#x201d; was utilized to screen the DEGs between control and DCM with HF samples. The cutoff criteria of DEGs was &#x7c;log<sub>2</sub>Fold Change (log<sub>2</sub>FC) &#x7c; &#x3e; 1 and adjusted <italic>p</italic> &#x3c; 0.05 (<xref ref-type="bibr" rid="B9">Chen et al., 2018</xref>). The Volcano plot of all DEGs and the clustering heatmap of the top 50 up-regulated genes and top 50 down-regulated genes were plotted by the R packages &#x201c;ggplot2&#x201d; and &#x201c;pheatmap&#x201d;, respectively.</p>
</sec>
<sec id="s2-3">
<title>Gene functional, pathway, and, disease enrichment analysis of up-regulated DEGs</title>
<p>To investigate the potential biological function, pathways, and related diseases of up-regulated DEGs, the R packages &#x201c;clusterProfiler&#x201d; and &#x201c;DOSE&#x201d; were used for Gene Ontology (GO), Kyoto Encyclopedia of Genes and Genomes (KEGG), and Disease Ontology (DO) enrichment analyses. The enrichment GO terms, KEGG pathways, and DO terms with <italic>q</italic> &#x3c; 0.05 were considered significant. Furthermore, we used the R package &#x201c;CBNplot&#x201d; to infer the Bayesian network (BN) on the gene expression profiles and KEGG enrichment analysis, showing the relationships between genes in the enriched pathways (<xref ref-type="bibr" rid="B37">Sato et al., 2022</xref>).</p>
</sec>
<sec id="s2-4">
<title>Construction of gene Co-expression network and identification of the modules</title>
<p>The R package &#x201c;WGCNA&#x201d; was used to construct the gene co-expression network and identify the modules correlated to DCM with HF (<xref ref-type="bibr" rid="B24">Langfelder and Horvath, 2008</xref>). First, a total of 9,379 genes with standard deviation (SD) of expression larger than 0 in the training group were selected for analysis. Second, the function &#x201c;hclust&#x201d; was used to cluster the samples to exclude the outliers. Third, a similarity matrix was obtained by calculating each pairwise gene correlation. It was then converted to an adjacency matrix using the soft adjacency function <inline-formula id="inf1">
<mml:math id="m1">
<mml:mrow>
<mml:msub>
<mml:mi>A</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mfenced open="|" close="|" separators="|">
<mml:mrow>
<mml:msub>
<mml:mi>S</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mi>&#x3b2;</mml:mi>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>, where <italic>i</italic> and <italic>j</italic> were any two of 9,379 genes, <italic>&#x3b2;</italic> is the soft threshold power, <italic>S</italic>
<sub>
<italic>ij</italic>
</sub> is the similarity matrix, and <italic>A</italic>
<sub>
<italic>ij</italic>
</sub> is the adjacency matrix. The function &#x201c;pickSoftThreshold&#x201d; selected the optimal soft threshold power (<italic>&#x3b2;</italic> &#x3d; 1&#x2013;20) to establish the scale-free topology. The optimal soft threshold power was also graphically validated by the high scale-free topology <italic>R</italic>
<sup>2</sup> between log10(k) and log10 (p(k)), where k is the connectivity between genes and p(k) means the probability of connectivity. Fourth, the adjacency matrix was turned into a Topological Overlap Matrix (TOM). The functions &#x201c;pickSoftThreshold&#x201d; and &#x201c;plotDendroAndColors&#x201d; were conducted to identify the modules and then plot the clustering dendrogram of genes together with dissimilarity on the topological overlap and various module colors. Herein, the parameters &#x201c;minModuleSize&#x201d; and &#x201c;MEDissThres&#x201d; were set to 60 and 0.3, respectively. Fifth, module-trait correlation analysis was performed to reveal the ME blue module as the most important one related to DCM with HF. Subsequently, the Gene significance (GS) and Module Membership (MM) were calculated by intramodular analysis. Genes with GS &#x3e; 0.5 and MM &#x3e; 0.8 were identified as driver genes in the ME blue module for further study (<xref ref-type="bibr" rid="B1">Ai et al., 2020</xref>).</p>
</sec>
<sec id="s2-5">
<title>Construction and validation of BPNN on feature genes</title>
<p>The intersection of up-regulated DEGs and driver genes in the ME blue module was identified as feature genes for DCM with HF. Next, the clustering heatmap of the feature gene expression was plotted using the R package &#x201c;pheatmap&#x201d;. BPNN, typically composed of processing elements arranged in at least three layers (input, hidden, and output layers), is a multilayer feedforward network trained on an error-back propagation algorithm (<xref ref-type="bibr" rid="B22">Kaundal et al., 2006</xref>). Here, BPNN was constructed in the training group based on feature genes and then validated in the test group using the R package &#x201c;neuralnet&#x201d;. For BPNN, the input and output layer neurons are equal to the feature gene number and the classification number (control or DCM with HF), respectively. According to common rule-of-thumb methods, the hidden layer neurons were determined and adjusted by 1/3&#x2013;2/3 of the input layer neurons (<xref ref-type="bibr" rid="B21">Karsoliya, 2012</xref>). Accordingly, the neuron numbers of the input layer, hidden layer, and output layer were set as 13, 5, and 2, respectively. The classification accuracies of BNPP in the training and test groups were evaluated by the AUC score of the ROC curve by the R package &#x201c;pROC&#x201d;. Additionally, we visualized Pearson&#x2019;s correlation among the 13 feature genes by the R package &#x201c;corrplot&#x201d;.</p>
</sec>
<sec id="s2-6">
<title>Construction and evaluation of RF, GBM, NN, XGBoost, and SVM</title>
<p>To narrow down the numbers of feature genes, Lasso was first performed to carry out feature selection. Five machine learning classifiers (RF, GBM, NN, XGBoost, and SVM) were then constructed for further feature selection on the Lasso-selected genes (<xref ref-type="bibr" rid="B17">Han et al., 2014</xref>). These models were all constructed through 10-fold cross-validation. The setting paraments of RF, NN, and SVM were 400 decision trees, five neurons in the hidden layer, and radial kernel. And paraments set by default for GBM and XGBoost. By using the R package &#x201c;glmnet&#x201d;, Lasso was first applied to reduce gene numbers for screening the feature genes. Then, five machine learning classifiers were established in the training and test groups based on the Lasso-selected feature genes using the R package &#x201c;caret&#x201d;. The classification performances of five models in the training and test groups were assessed by AUC scores using the package &#x201c;pROC&#x201d;. The residual and feature importance of classifiers were analyzed by the R package &#x201c;DALEX&#x201d;. Net Benefit (NB) calculated by Decision Curve Analysis (DCA) and Brier score were also utilized to measure the clinical value and calibration of classifiers, respectively (<xref ref-type="bibr" rid="B12">Fitzgerald et al., 2015</xref>; <xref ref-type="bibr" rid="B2">Alba et al., 2017</xref>). In general, the classifier with the lowest residual, minimum Brier score, highest AUC, and maximum NB was considered the best predictive classifier for further feature selection. Herein, RF was selected as the best-performing classifier for accurately distinguishing between normal and DCM with HF groups. Using the LASSO-selected genes, the R packages &#x201c;caret&#x201d; and &#x201c;randomForest&#x201d; were used to build an RF classifier in the training and test groups. The feature importance of RF was investigated by using the Gini gain approach. Feature genes with a mean decrease Gini larger than two were selected as key genes for diagnosing DCM with HF (<xref ref-type="bibr" rid="B47">Tian et al., 2020</xref>).</p>
</sec>
<sec id="s2-7">
<title>Differentially expression, diagnostic accuracy, and target therapeutic drug prediction analyses of key genes</title>
<p>Then, within the training and test groups, we analyzed the expression distribution and diagnostic accuracy of key genes selected by RF. By using the R package &#x201c;ggpubr&#x201d;, the boxplots were plotted and demonstrated the differential expression distributions of key genes between control and DCM with HF groups. The diagnostic accuracies of key genes for DCM with HF were evaluated by the AUC score of the ROC curve using the R packages &#x201c;pROC&#x201d;. Furthermore, we established a logistic regression model for evaluating the diagnostic accuracy of the key genes&#x2019; combination using the R package &#x201c;glmnet&#x201d;. Furthermore, the nomogram was used to illustrate and visualize the logistic regression model by the R package &#x201c;rms&#x201d;. The calibration curve and NB calculated by DCA were utilized to evaluate the prediction effect of the nomogram. The gene with an AUC score ranging from 0.85 to 1.0 was considered to have excellent specificity and sensitivity to distinguish between the control group and DCM with HF group. The Human Protein Atlas (HPA) database (<ext-link ext-link-type="uri" xlink:href="https://www.proteinatlas.org/">https://www.proteinatlas.org/</ext-link>) was used to explore the extracellular locations and tissue-specific expression levels of the key genes. Moreover, Drug Signatures Database (DSigDB) (<ext-link ext-link-type="uri" xlink:href="https://maayanlab.cloud/Enrichr/">https://maayanlab.cloud/Enrichr/</ext-link>) (<xref ref-type="bibr" rid="B23">Kuleshov et al., 2016</xref>) was applied to predict potential therapeutic drugs target for three key genes, with adjusted <italic>p</italic> &#x3c; 0.05 as the filtering threshold.</p>
</sec>
<sec id="s2-8">
<title>Assessment of key genes expression on single-cell RNA-seq data</title>
<p>To further confirm the differential expression of key genes in DCM with HF, we performed single-cell RNA-seq analysis on GSE95140, mainly including cell type identification and Pseudotime-ordered analysis. First, we performed quality control and data cleaning using the R package &#x201c;dplyr&#x201d;. The screening criteria were set: the number of genes in each cell ranges from 200 to 7,500, and the percentage of mitochondrial genes in each cell is lower than 20%. Second, the function &#x201c;NormalizeData&#x201d; of the R package &#x201c;seruat&#x201d; was used to perform log2 transformation on the raw count data. Next, the top 2000 hypervariable genes were selected by the function &#x201c;FindVariableFeatures&#x201d;. Z-score standardization was conducted using the function &#x201c;ScaleData&#x201d;. Third, PCA was carried out on the hypervariable genes in the control and DCM groups. Next, two PCs (control group, all <italic>p</italic> &#x3c; 0.01) and four PCs (DCM group, all <italic>p</italic> &#x3c; 0.01) were selected. Then, two clusters (control group) and four clusters (DCM group) were obtained and projected onto UMAP plots, respectively. Fourth, the marker genes of cardiomyocyte (NNT2, MYH7), fibroblast (DCN, COL1A1), and endothelial cell (CDH5, VWF) obtained from CellMarker 2.0 database (<ext-link ext-link-type="uri" xlink:href="http://yikedaxue.slwshop.cn/">http://yikedaxue.slwshop.cn/</ext-link>) (<xref ref-type="bibr" rid="B51">Zhang et al., 2019</xref>) were used to identify cardiomyocytes in different states. We then explored the expression distribution of key genes and NPPB in the control and DCM groups. NPPB, an important paralog of NPPA with up-regulation in DCM with HF (<xref ref-type="bibr" rid="B5">Barth et al., 2006</xref>), was selected as an indicator to reveal whether the key genes showed co-expression and dynamic expression patterns of NPPB. Fifth, the R package &#x201c;monocle&#x201d; was used to conduct Pseudotime-ordered analysis using the &#x201c;DDRTree&#x201d; method on the DCM group. Using the function &#x201c;plot_cell_trajectory&#x201d;, the differentiation trajectory of cardiomyocytes was visualized in the tree diagram. Additionally, we analyzed and visualized the dynamic expression patterns of key genes and NPPB during the cardiomyocyte transitions across the Pseudotime using the function &#x201c;plot_genes_in_pseudotime&#x201d;.</p>
</sec>
<sec id="s2-9">
<title>Inference of pathways regulated by key genes in DCM with HF</title>
<p>Considering the limitation of performing KEGG on small gene sets, GSEA was utilized to explore the potential pathways of key genes. We conducted GSEA on the training group using the R package &#x201c;clusterProfiler&#x201d;. The KEGG gene sets annotated for GSEA (c2.cp.kegg.v7.5.1.symbols) were downloaded from the MSigDB database (<ext-link ext-link-type="uri" xlink:href="http://www.gsea-msigdb.org/gsea/msigdb/index.jsp">http://www.gsea-msigdb.org/gsea/msigdb/index.jsp</ext-link>). First, the samples were divided into low- and high-expression groups according to the median expression of NPPA, OMD, and PRELP, respectively. Then, we ranked 21,628 genes in descending order by calculating the log<sub>2</sub>FC for each gene. Second, the GSEA was performed on these ranked genes using the KEGG gene sets. The enrichment KEGG pathways with <italic>p</italic> &#x3c; 0.05 and &#x7c;Normalized Enrichment Score (NES)&#x7c; &#x3e; 1 were considered significant (<xref ref-type="bibr" rid="B53">Zheng et al., 2022</xref>). NES was the primary statistic to examine the enrichment results, the value indicates the relationships between enrichment pathways and key genes. Herein, the intersection of enrichment KEGG pathways of each key gene was determined as the potential pathway in DCM with HF. Subsequently, we carried out Pearson&#x2019;s correlation analysis between each key gene and the potential pathway-related genes. &#x7c;<italic>R</italic>&#x7c; &#x3e; 0.3 and <italic>p</italic> &#x3c; 0.05 was the cutoff criteria. The intersection of pathway genes significantly correlated with each key gene was considered important and used for further analysis. Next, the Pathview online tool (<ext-link ext-link-type="uri" xlink:href="https://pathview.uncc.edu/home">https://pathview.uncc.edu/home</ext-link>) (<xref ref-type="bibr" rid="B25">Luo et al., 2017</xref>) was used to perform Z-score normalization on the expressions of these intersection genes between control and DCM with HF groups and projected their relative expression values onto the KEGG pathway.</p>
</sec>
<sec id="s2-10">
<title>Statistical analysis</title>
<p>Statistical analysis was conducted using R programming language (version 4.2.1). Wilcoxon test was performed to analyze the differential expression of key genes in DCM with HF group versus control group. The diagnostic ability of each key gene was evaluated by the AUC score. <italic>P</italic> &#x3c; 0.05 was considered statistically significant.</p>
</sec>
</sec>
<sec sec-type="results" id="s3">
<title>Results</title>
<sec id="s3-1">
<title>Identification of DEGs in DCM with HF</title>
<p>The gene expression matrices of the training group were obtained after data cleaning, normalization, batch effect removal, and merging, including 20 normal myocardial samples (control group) and 35 myocardial samples derived from DCM patients with HF (DCM with HF group). The PCA score plot showed the relatively consistent clustering of two groups from two components (<xref ref-type="fig" rid="F1">Figure 1A</xref>), which can be used in subsequent analysis due to between-group differences. A total of 218 DEGs (135 up-regulated genes and 83 down-regulated genes) were screened under the threshold (&#x7c;log<sub>2</sub>FC&#x7c; &#x3e; 1 and adjusted <italic>p</italic> &#x3c; 0.05). The Volcano plot of DEGs was then plotted using the log<sub>2</sub>FC and -log10 (adjusted <italic>p</italic>) (<xref ref-type="fig" rid="F1">Figure 1B</xref>). The top 50 up-regulated genes and the top 50 down-regulated genes were shown in the heatmap (<xref ref-type="fig" rid="F1">Figure 1C</xref>).</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>Data processing and identification of DEGs. <bold>(A)</bold> PCA score plot of the training group dataset after batch removal showing the difference between control and DCM with HF groups. <bold>(B)</bold> Volcano plot of DEGs. Red dots represent up-regulated genes and blue dots represent down-regulated genes. <bold>(C)</bold> Heatmap displaying a differential expression of the top 50 up-regulated genes and top 50 down-regulated genes.</p>
</caption>
<graphic xlink:href="fcell-10-1089915-g001.tif"/>
</fig>
</sec>
<sec id="s3-2">
<title>Inference of biological functions, pathways, and diseases for up-regulated DEGs</title>
<p>The GO, KEGG, and DO enrichment analyses were conducted to annotate the potential functions, pathways, and diseases of 135 up-regulated DEGs, respectively. As shown in <xref ref-type="fig" rid="F2">Figure 2A</xref>, the enrichment GO terms of biological process (BP) included muscle cell migration, striated muscle adaptation, and skeletal muscle adaptation; the enrichment GO terms of cellular component (CC) included collagen&#x2212;containing extracellular matrix, myofilament, and striated muscle thin filament; the enrichment GO terms of molecular function (MF) included integrin binding, cytokine activity, and extracellular matrix structural constituent. DO enrichment analysis showed that the DEGs were associated with many heart diseases, such as arteriosclerotic cardiovascular disease, coronary artery disease, and myocardial infarction (<xref ref-type="fig" rid="F2">Figure 2B</xref>). Additionally, the enriched KEGG pathways mainly contained muscle contraction, post-translational protein phosphorylation, and regulation of Insulin-like Growth Factor (IGF) transport and uptake by Insulin-like Growth Factor Binding Proteins (IGFBPs) (<xref ref-type="fig" rid="F2">Figure 2C</xref>).The BN plot further demonstrated the enriched gene interactions in muscle contraction (<xref ref-type="fig" rid="F2">Figure 2D</xref>). Furthermore, NPPA acted as the core gene with higher expression and more edges, indicating its crucial role in muscle contraction.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>Potential biological function, pathways, and associated diseases of up-regulated DEGs. <bold>(A)</bold> GO enrichment analysis of up-regulated DEGs. <bold>(B)</bold> DO enrichment analysis of up-regulated DEGs. <bold>(C)</bold> KEGG enrichment analysis of up-regulated DEGs. <bold>(D)</bold> Bayesian network plot showing the regulatory relationships of genes in muscle contraction.</p>
</caption>
<graphic xlink:href="fcell-10-1089915-g002.tif"/>
</fig>
</sec>
<sec id="s3-3">
<title>Weighted gene co-expression network construction</title>
<p>WGCNA was utilized to construct the gene co-expression network and identify the trait-correlated modules in the training group. First, the similarity matrix was calculated and then transformed into the adjacent matrix via the optimal soft threshold power (<italic>&#x3b2;</italic> &#x3d; 2) (<xref ref-type="fig" rid="F3">Figures 3A,B</xref>). Besides, the inverse relationship of p(k) and k was observed (<xref ref-type="fig" rid="F3">Figure 3C</xref>), and the scale-free topology <italic>R</italic>
<sup>2</sup> of log10(k) and log10 (p(k)) was 0.87 when <italic>&#x3b2;</italic> &#x3d; 2 (<xref ref-type="fig" rid="F3">Figure 3D</xref>), which illustrated <italic>&#x3b2;</italic> &#x3d; 2 was suitable for constructing a scale-free topology. Second, the TOM was converted from the adjacent matrix and turned into the dissTOM (dissTOM &#x3d; 1-TOM) for hierarchical clustering. Dynamic tree shearing clustered the similarity genes based on the topological overlap and then divided them into various modules (<xref ref-type="fig" rid="F4">Figure 4A</xref>). Third, we related the modules to clinical trait and further obtained the driver genes in the strongest positive correlation module. As shown in <xref ref-type="fig" rid="F4">Figure 4B</xref>, we ultimately identified the ME blue module strongly positively related to DCM with HF (<italic>R</italic> &#x3d; 0.77, <italic>p</italic> &#x3c; 0.001), containing 2,411 genes. Fourth, the significant GS distribution across the seven modules was observed (<xref ref-type="fig" rid="F4">Figure 4C</xref>). Additionally, the intramodular analysis demonstrated the close relationship between MM and GS of the ME blue module (<italic>R</italic> &#x3d; 0.81, <italic>p</italic> &#x3c; 0.001; <xref ref-type="fig" rid="F4">Figure 4D</xref>), thus relieving the module genes highly associated with DCM with HF. Finally, a total of 15 genes with GS &#x3e; 0.5 and MM &#x3e; 0.8 (C14orf132, CFH, COL8A1, CTGF, ETNPPL, FIBIN, FRZB, ITGBL1, LTBP2, MFAP4, NPPA, NRK, OMD, PRELP, SFRP4) were identified as driver genes in the ME blue module.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>Determination of optimal soft threshold power for scale-free topology. <bold>(A)</bold> The scale-free topology fit index (<italic>R</italic>
<sup>2</sup>) for soft threshold power (<italic>&#x3b2;</italic>) from 1 to 20. <bold>(B)</bold> The mean connectivity (k) for <italic>&#x3b2;</italic> from 1 to 20. <bold>(C)</bold> Histogram of connectivity frequency. <bold>(D)</bold> The scale-free topology <italic>R</italic>
<sup>2</sup> between log<sub>10</sub>(k) and log<sub>10</sub> (p(k)) when <italic>&#x3b2;</italic> &#x3d; 2.</p>
</caption>
<graphic xlink:href="fcell-10-1089915-g003.tif"/>
</fig>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>Identification of driver genes in module related to DCM with HF. <bold>(A)</bold> Dendrogram of all genes with dissimilarity clustered on topological overlap. <bold>(B)</bold> Correlation of seven modules and two traits (control and DCM with HF). The blue module was significantly correlated with DCM with HF (<italic>R</italic> &#x3d; 0.77, <italic>p</italic> &#x3c; 0.001). <bold>(C)</bold> Boxplot of Gene Significance (GS) distribution across seven modules. <bold>(D)</bold> Scatterplot of Module Membership (MM) in the blue module versus GS for DCM with HF.</p>
</caption>
<graphic xlink:href="fcell-10-1089915-g004.tif"/>
</fig>
</sec>
<sec id="s3-4">
<title>Construction and validation of BPNN on 13 feature genes</title>
<p>We selected the intersection of 135 up-regulated DEGs and 15 driver genes in the ME blue module as the feature genes of DCM with HF, with a total of 13 genes (OMD, PRELP, NPPA, LTBP2, C14orf132, FIBIN, SFRP4, FRZB, MFAP4, COL8A1, CFH, CTGF, ITGBL1) (<xref ref-type="fig" rid="F5">Figure 5A</xref>). These 13 genes were previously proved to participate in muscle contraction, striated muscle adaptation, and extracellular matrix structural constituent (<xref ref-type="fig" rid="F2">Figures 2A,B</xref>), indicating their potential crucial roles in DCM with HF. <xref ref-type="fig" rid="F5">Figure 5B</xref> showed the differential expressions of feature genes between control and DCM with HF groups. Subsequently, a BPNN with 13 neurons in the input layer (13 feature genes), five neurons in the hidden layer, and two neurons in the output layer (classification numbers: control or DCM with HF) was constructed in the training group and then validated in the test group (<xref ref-type="fig" rid="F5">Figure 5C</xref>). The BPNN showed prediction accuracy with a high AUC score of 0.988 in the training group (<xref ref-type="fig" rid="F5">Figure 5D</xref>). However, the predictive power of BNPP decreased significantly in the test group compared to the training group, merely achieving an AUC score of 0.745 (<xref ref-type="fig" rid="F5">Figure 5E</xref>). These results suggested that the collinearity between the screened 13 feature genes resulted in the constructed BPNN over-fitting for general prediction (<xref ref-type="sec" rid="s11">Supplementary Figure S2</xref>). Thus, feature selection was crucial for further obtaining the key genes for the diagnosis of DCM with HF.</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>Construction and validation of BPNN on 13 feature genes. <bold>(A)</bold> The intersection of 135 up-regulated genes and 15 driver genes in the blue module as feature genes. <bold>(B)</bold> Expression heatmap of 13 feature genes in control and DCM with HF groups. <bold>(C)</bold> BPNN constructed with 13 neurons in the input layer, five neurons in the hidden layer, and two neurons in the output layer. ROC curve for evaluating classification accuracy in the training group <bold>(D)</bold> and test group <bold>(E)</bold>. I, input layer; H, hidden layer; O, output layer; B, bias.</p>
</caption>
<graphic xlink:href="fcell-10-1089915-g005.tif"/>
</fig>
</sec>
<sec id="s3-5">
<title>NPPA, OMD, and PRELP were the key genes for DCM with HF</title>
<p>To narrow down the range of feature genes, Lasso within the training group was first performed. As shown in <xref ref-type="fig" rid="F6">Figure 6A</xref>, Lasso retained five genes from 13 feature genes under the optimal log(&#x3bb;) as 0.0156. Through the 10-fold cross-validation, the minimum binomial deviation with optimal log(&#x3bb;) was observed, indicating the five genes were optimally selected by Lasso (<xref ref-type="fig" rid="F6">Figure 6B</xref>). Second, five machine learning models (RF, GBM, NN, XGBoost, and SVM) were established on the five LASSO-selected genes and validated their classification performances based on a series of indexes (residual, Brier score, AUC score, NB) in the training and test groups. Strikingly, the RF model showed robust classification ability, with the lowest residual (<xref ref-type="fig" rid="F6">Figure 6C</xref>) and Brier score (<xref ref-type="sec" rid="s11">Supplementary Table S1</xref>), highest AUC achieving 1 (<xref ref-type="sec" rid="s11">Supplementary Figures S3A,C</xref>), and NB under threshold probability (<xref ref-type="sec" rid="s11">Supplementary Figures S3B,D</xref>) in the training and test groups. Thus, the RF classifier was considered the most suitable performance classifier for further feature selection. Moreover, the importance of feature genes selected from five classifiers was illustrated by Root Mean Square Error (RMSE) loss (<xref ref-type="fig" rid="F6">Figure 6D</xref>). Third, we constructed the RF model with 400 decision trees (<xref ref-type="fig" rid="F6">Figure 6E</xref>), and three features with mean decrease Gini coefficients larger than 2 (OMD, PRELP, NPPA) were selected as key genes for diagnosing DCM with HF (<xref ref-type="fig" rid="F6">Figure 6F</xref>).</p>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption>
<p>Obtaining the key genes for the diagnosis of DCM with HF. <bold>(A)</bold> The coefficients of 13 feature genes shown by log(&#x3bb;). <bold>(B)</bold> The relationship between binomial deviation and log(&#x3bb;) by 10-fold cross-validation (CV). <bold>(C)</bold> Residual diagram of Random Forest (RF), Gradient Boosting Machine (GBM), Neural Network (NN), eXtreme Gradient Boosting (XGBoost), and Support Vector Machine (SVM) classification. <bold>(D)</bold> Root Mean Square Error (RMSE) loss after feature removal from models. <bold>(E)</bold> The effect of decision tree number on CV error of RF classifier. Green, red, and black curves represent the error of control, DCM with HF, and total groups, respectively. <bold>(F)</bold> The mean decrease Gini coefficients of genes in the RF classifier. OMD, PRELP, and NPPA were the key genes with mean decrease Gini larger than 2.</p>
</caption>
<graphic xlink:href="fcell-10-1089915-g006.tif"/>
</fig>
</sec>
<sec id="s3-6">
<title>NPPA, OMD, and PRELP were up-regulated with diagnostic abilities in DCM with HF</title>
<p>To test whether NPPA, OMD, and PRELP could serve as the diagnostic biomarkers of DCM with HF, their mRNA expression levels and diagnostic abilities were then analyzed. As shown in <xref ref-type="fig" rid="F7">Figures 7A,B</xref>, the over-expression levels of NPPA, OMD, and PRELP were observed in DCM with HF in the training group and test group. Furthermore, the AUC scores of NPPA (AUC &#x3d; 0.967), OMD (AUC &#x3d; 0.984), PRELP (AUC &#x3d; 0.974), and their combination (AUC &#x3d; 0.986) for diagnosing DCM with HF were all larger than 0.9 in the training group (<xref ref-type="fig" rid="F7">Figure 7C</xref>). The AUC scores of NPPA (AUC &#x3d; 0.863), OMD (AUC &#x3d; 0.722), and PRELP (AUC &#x3d; 0.816) decreased in the test group (<xref ref-type="fig" rid="F7">Figure 7D</xref>). However, the AUC score of the combination of NPPA, OMD, and PRELP markedly achieved 0.922 within the test group. These results suggested NPPA, OMD, and PRELP be promising diagnostic biomarkers for DCM with HF. To measure the combined diagnostic accuracies of NPPA, OMD, and PRELP, a logistic regression model was constructed and displayed in the nomogram (<xref ref-type="sec" rid="s11">Supplementary Figure S4</xref>). Interestingly, the combination of NPPA, OMD, and PRELP improved the diagnostic effect within the training and test groups. We also observed the heart muscle-specific expressions of NPPA, OMD, and PRELP, and their extracellular locations were all predicted to be secreted in the HPA database (<xref ref-type="sec" rid="s11">Supplementary Figure S5</xref>), which provided strong evidence that NPPA, OMD, and PRELP served promising biomarkers of DCM with HF.</p>
<fig id="F7" position="float">
<label>FIGURE 7</label>
<caption>
<p>Differential expression and diagnostic accuracy of key genes in the training and test groups. The mRNA expression levels of NPPA, OMD, and PRELP between normal hearts and damaged hearts of DCM with HF in the training group <bold>(A)</bold> and test group <bold>(B)</bold>. ROC curves for evaluating diagnostic accuracy of NPPA, OMD, and PRELP in the training group <bold>(C)</bold> and test group <bold>(D)</bold>.</p>
</caption>
<graphic xlink:href="fcell-10-1089915-g007.tif"/>
</fig>
</sec>
<sec id="s3-7">
<title>Target therapeutic drug prediction for NPPA</title>
<p>Herein, we used DSigDB to predict the potential therapeutic drugs associated with NPPA, OMD, and PRELP. A total of 17 target drugs related to NPPA were finally predicted, but not associated with OMD and PRELP. And the specific information on the top 10 predicted drugs was shown in <xref ref-type="sec" rid="s11">Supplementary Table S2</xref>. Among these drugs, the antihypertensive efficacy of alprostadil, labetalol, felodipine, and irbesartan has been reported (<xref ref-type="bibr" rid="B20">Johnson and Fugman, 1983</xref>; <xref ref-type="bibr" rid="B26">MacCarthy and Bloomfield, 1983</xref>; <xref ref-type="bibr" rid="B8">Cattaneo et al., 2003</xref>). Additionally, previous studies have shown that irbesartan, furosemide, and Bonuten can treat HF (<xref ref-type="bibr" rid="B20">Johnson and Fugman, 1983</xref>; <xref ref-type="bibr" rid="B45">Swedberg et al., 1987</xref>; <xref ref-type="bibr" rid="B46">Thompson et al., 1999</xref>). Several pieces of evidence have supported that these predictive drugs targeting NPPA could cure some cardiovascular disorders such as hypertension and HF, thus indicating their value in the treatment of DCM with HF.</p>
</sec>
<sec id="s3-8">
<title>Single-cell RNA-seq analysis revealed the over-expression patterns of NPPA, OMD, and PRELP were stable in DCM patients</title>
<p>To investigate the expression patterns of NPPA, OMD, and PRELP in DCM patients, we conducted single-cell RNA-seq analysis on GSE95140. The quality control, data cleaning, and PC selection were shown in <xref ref-type="sec" rid="s11">Supplementary Figure S6</xref>. The entire cell profiles of the control group and DCM group were classified into 2 clusters (<xref ref-type="fig" rid="F8">Figure 8A</xref>) and 3 clusters (<xref ref-type="fig" rid="F8">Figure 8C</xref>) and projected onto UMAP plots, respectively. We identified the cell type using specific gene markers (NNT2 and MYH7 for cardiomyocyte; DCN and COL1A1 for fibroblast; CDH5 and VWF for endothelial cell) in the control and DCM groups (<xref ref-type="sec" rid="s11">Supplementary Figure S7</xref>). We annotated one cardiomyocyte type and three distinct cardiomyocyte types in the control group and DCM group, respectively (<xref ref-type="fig" rid="F8">Figures 8A,C</xref>). Then, we analyzed the expression of NPPA, OMD, PRELP, and NPPB in cardiomyocytes of control and DCM groups. As shown in <xref ref-type="fig" rid="F9">Figures 9B,D</xref>, higher expression levels of NPPA, OMD, PRELP, and NPPB were observed in most cardiomyocytes in DCM compared to the control group. Interestingly, we noticed that type 2 of the DCM group showed high expression of NPPA and NPPB, suggesting that cardiomyocytes with higher degrees of HF in these types. We also performed Pseudotime-ordered analysis on the DCM group to explore the expression changes of NPPA, OMD, PRELP, and NPPB during the cardiomyocyte transitions along the Pseudotime. <xref ref-type="fig" rid="F9">Figure 9E</xref> showed the differentiation trajectory path of cardiomyocytes ordered by different types. <xref ref-type="fig" rid="F9">Figure 9F</xref> further displayed the stable expression patterns of NPPA, OMD, PRELP, and NPPB in diverse cardiomyocytes by Pseudotime. Notably, the dynamic expression changes of NPPA and NPPB were similar, indicating an expression linkage between NPPA and NPPB in DCM. Overall, these results showed NPPA, OMD, and PRELP were enriched in cardiomyocytes of DCM and displayed stable expression patterns, which fluctuated slightly with differential cell states.</p>
<fig id="F8" position="float">
<label>FIGURE 8</label>
<caption>
<p>Verification of key genes expression pattern on single-cell RNA-seq analysis. <bold>(A)</bold> UMAP projection of distinct normal cardiomyocytes in GSE95140. <bold>(B)</bold> Distribution of NPPB, NPPA, OMD, and PRELP in distinct normal cardiomyocytes. <bold>(C)</bold> UMAP projection showing three types of cardiomyocytes of DCM patients in GSE95140. <bold>(D)</bold> Distribution of NPPB, NPPA, OMD, and PRELP in distinct cardiomyocytes of DCM. <bold>(E)</bold> Pseudotime-ordered analysis of cardiomyocytes of DCM. <bold>(F)</bold> Dynamic expression of NPPB, NPPA, OMD, and PRELP by the Pseudotime.</p>
</caption>
<graphic xlink:href="fcell-10-1089915-g008.tif"/>
</fig>
<fig id="F9" position="float">
<label>FIGURE 9</label>
<caption>
<p>The potential pathway regulated by key genes in the development of DCM with HF. GSEA on low- and high-expression groups of NPPA <bold>(A)</bold>, OMD <bold>(B)</bold>, and PRELP <bold>(C)</bold>. <bold>(D)</bold> Intersection of TGF-&#x3b2; pathway genes significantly correlated with NPPA, OMD, and PRELP. <bold>(E)</bold> The relative expression of INHBA, ID4, TGFB3, SMAD7, and SMAD9 in TGF-&#x3b2; signaling pathway.</p>
</caption>
<graphic xlink:href="fcell-10-1089915-g009.tif"/>
</fig>
</sec>
<sec id="s3-9">
<title>NPPA, OMD, and PRELP may participate in TGF-&#x3b2; signaling pathway in DCM with HF</title>
<p>To gain insight into the potential pathways of NPPA, OMD, and PRELP, GSEA was performed for each gene. As shown in <xref ref-type="fig" rid="F9">Figure 9A</xref>, the top three positively significant KEGG pathways for NPPA were &#x201c;citrate cycle (TCA cycle)&#x201d;, &#x201c;basal cell carcinoma&#x201d;, and &#x201c;TGF-&#x3b2; signaling pathway&#x201d;. The top two positively significant KEGG pathways for OMD were enriched (<xref ref-type="fig" rid="F9">Figure 9B</xref>), including &#x201c;basal cell carcinoma&#x201d; and &#x201c;TGF-&#x3b2; signaling pathway&#x201d;. The top three positively significant KEGG pathways for PRELP shown in <xref ref-type="fig" rid="F9">Figure 9C</xref> were &#x201c;citrate cycle (TCA cycle)&#x201d;, &#x201c;basal cell carcinoma&#x201d;, and &#x201c;TGF-&#x3b2; signaling pathway&#x201d;. Interestingly, the terms &#x201c;basal cell carcinoma&#x201d; and &#x201c;TGF-&#x3b2; signaling pathway&#x201d; were enriched in the KEGG pathways of NPPA, OMD, and PRELP, and acted as the positive pathways. The TGF-&#x3b2; signaling pathway was considered the most likely mechanism involved by NPPA, OMD, and PRELP. We then analyzed Pearson&#x2019;s correlation of NPPA, OMD, and PRELP and the TGF-&#x3b2; signaling pathway gene sets (<xref ref-type="sec" rid="s11">Supplementary Table S3</xref>), respectively. And 16 NPPA-correlated, 20 OMD-correlated, and 26 PRELP-correlated genes were obtained (<xref ref-type="sec" rid="s11">Supplementary Table S4</xref>). The intersections of these genes were INHBA, ID4, TGFB3, SMAD7, and SMAD9 (<xref ref-type="fig" rid="F9">Figure 9D</xref>). Then, the expression levels of INHBA, ID4, TGFB3, SMAD7, and SMAD9 between control and DCM with HF groups were normalized and visualized in the TGF-&#x3b2; signaling pathway (<xref ref-type="fig" rid="F9">Figure 9E</xref>). Additionally, we observed that ID4, SMAD7, and SMAD9 were up-regulated in the TGF-&#x3b2; signaling pathway. While INHBA and TGFB3 were down-regulated. Accordingly, we inferred that the TGF-&#x3b2; signaling pathway positively associated with NPPA, OMD, and PRELP might play a crucial role in the process of DCM with HF.</p>
</sec>
</sec>
<sec sec-type="discussion" id="s4">
<title>Discussion</title>
<p>The pathogenesis of DCM with HF has remained unclear, mostly because of the heterogeneous etiology and clinical presentation (<xref ref-type="bibr" rid="B38">Schultheiss et al., 2019</xref>). Considering that the progressive condition of DCM leads to impaired contractility, preventing or treating HF is currently the first-line therapy for DCM patients (<xref ref-type="bibr" rid="B38">Schultheiss et al., 2019</xref>; <xref ref-type="bibr" rid="B27">Mahmaljy et al., 2022</xref>). For DCM patients with end-stage HF, the sole feasible treatment is heart transplantation (<xref ref-type="bibr" rid="B18">Iwata et al., 2020</xref>). Accordingly, identifying underlying genes and mechanisms of DCM with HF may help improve the early diagnosis and novel treatment. In this study, we conducted a systemic bioinformatics analysis on mRNA-seq and scRNA-seq data from DCM patients with HF. The promising diagnosis biomarkers were screened through WGCNA and machine learning, and the regulated potential pathway in the development of DCM with HF were further identified.</p>
<p>To our knowledge, this is the first attempt to combine WGCNA with machine learning to explore specific biomarkers to distinguish DCM patients with HF from the control group. The newly developed bioinformatics method, CBNplot, was utilized for exploring the pathway and gene interaction on Bayesian network inference (<xref ref-type="bibr" rid="B37">Sato et al., 2022</xref>). In our research, we first screened 218 DEGs (135 up-regulated genes and 83 down-regulated genes) between control and DCM with HF groups. Then, we performed GO, KEGG, and DO enrichment analyses on 135 up-regulated DEGs. The results showed that the enriched GO terms and KEGG pathways were related to muscle cell functions or activities, such as muscle cell migration, myofilament, and muscle contraction. And many heart diseases such as arteriosclerotic cardiovascular disease, coronary artery disease, and myocardial infarction were enriched. Previous studies have shown dysfunctional myocardium in DCM patients with HF (<xref ref-type="bibr" rid="B40">Schwinger et al., 1992</xref>). Thus, 135 up-regulated DGEs might involve in the pathological process of DCM with HF, were obtained for further selection. In addition, WGCNA was conducted to identify the gene module (ME blue module) that is highly positively related to DCM with HF (<italic>R</italic> &#x3d; 0.77, <italic>p</italic> &#x3c; 0.001) based on gene co-expression pattern. We then obtained 15 driver genes with higher GS and MM (C14orf132, CFH, COL8A1, CTGF, ETNPPL, FIBIN, FRZB, ITGBL1, LTBP2, MFAP4, NPPA, NRK, OMD, PRELP, SFRP4) from the ME blue module. The intersection of 15 diver genes and 135 up-regulated genes, OMD, PRELP, NPPA, LTBP2, C14orf132, FIBIN, SFRP4, FRZB, MFAP4, COL8A1, CFH, CTGF, and ITGBL1, were then selected as 13 features to construct a BNPP classifier in the training and test groups. The BPNN established with 13 neurons in the input layer, five neurons in the hidden layer, and two neurons in the output layer showed excellent classification performance in the training group (AUC &#x3d; 0.988), but the performance in the test group was poor (AUC &#x3d; 0.745). The results suggested that the BNPP on 13 feature genes was not suitable as an over-fitting model to distinguish DCM patients with HF from normal. Col-linearity between these 13 feature genes may be the reason why the over-fitting model was constructed (Supplementary Figure 2). Accordingly, further feature selection was needed to identify the key genes of DCM with HF.</p>
<p>Herein, we first performed LASSO selection to narrow the range of feature genes and identified five genes with non-zero coefficients (OMD, PRELP, NPPA, LTBP2, and CTGF). Next, five well-established machine learning algorithms, including RF, GBM, NN, XGBoost, and SVM, were applied as classifiers based on the LASSO-selected genes. We then assessed their classification performances within the training and test groups by residual, AUC score, Brier score, and NB. And RF performed with the lowest residual and Brier score, along with the highest AUC and NB was considered the best-performing classifier. Thus, three significant explanatory features (OMD, PRELP, and NPPA) in RF were selected as key genes for DCM with HF. To test whether OMD, PRELP, and NPPA could serve as diagnostic biomarkers, we analyzed their expression levels and diagnostic values in DCM with HF. Boxplots demonstrated the up-regulation of OMD, PRELP, and NPPA in the DCM with HF group. Within the training and test groups, OMD, PRELP, and NPPA had certain diagnostic values (all AUC &#x3e;0.7), of which PRELP and NPPA may have significant diagnostic abilities (all AUC &#x3e;0.8). We also found that the combination of OMD, PRELP, and NPPA could efficiently distinguish DCM patients with HF from normal, with AUC &#x3d; 0.986 in the training group and AUC &#x3d; 0.922 in the test group. These results suggested that OMD, PRELP, and NPPA may be promising diagnostic biomarkers, along with high expression levels in DCM with HF. Additionally, the heart muscle-specific and secreted expressions observed in the HPA database also demonstrated the potential application of OMD, PRELP, and NPPA as diagnostic biomarkers. Additionally, DSigDB was used to predict the therapeutic drugs targeting NPPA for finding the potential effective drug therapy of DCM with HF. Several identified drugs, including alprostadil, labetalol, felodipine, irbesartan, furosemide, and Bonuten, have been proven to cure cardiovascular diseases such as hypertension and HF. These results indicated their potential application in treating DCM with HF. However, the specific role of the predicted drugs in DCM with HF still needed further experimental validations <italic>in vivo</italic> and <italic>in vitro</italic>.</p>
<p>To further investigate the expression distributions and changes of OMD, PRELP, and NPPA, single-cell RNA-seq analysis was conducted to evaluate their expressions in cardiomyocytes derived from DCM patients. We first delineated the cardiomyocyte distributions in the control and DCM groups using UMAP plots, respectively. Leveraging gene markers (cardiomyocyte, fibroblast, and endothelial cell) from CellMarker2.0 database, distinct cardiomyocyte types were then annotated and identified. Subsequently, the high expression patterns of NPPA, OMD, and PRELP were observed in cardiomyocytes of DCM. We also explored the dynamic expression patterns of NPPA, OMD, and PRELP during the cardiomyocyte transitions across the Pseudotime. It was shown that the expression fluctuations of NPPA, OMD, and PRELP demonstrated stable expression patterns in cardiomyocyte differentiation ordered by the Pseudotime. Moreover, we found that NPPA expression pattern in DCM was similar to NPPB, a classical biomarker of HF. In summary, these results showed that the over-expression patterns of NPPA, OMD, and PRELP were relatively stable regardless of cardiomyocyte types or states, which suggests the large potential for serving diagnostic biomarkers.</p>
<p>Among the identified three genes of DCM with HF, NPPA has already been known to involved in cardiomyopathies, while reports on OMD and PRELP are limited. Atrial Natriuretic Peptide (ANP) encoded by NPPA belongs to the natriuretic peptide family and has been developed to be diagnostic biomarkers of HF (<xref ref-type="bibr" rid="B15">Goetze et al., 2020</xref>), which also demonstrated NPPA can be a positive biomarker control to validate our analysis accuracy. OMD encoded a leucine-rich keratin sulfate proteoglycan located in the extracellular matrix (ECM), which participated in cell adhesion and tissue mineralization (<xref ref-type="bibr" rid="B44">Skenteris et al., 2022</xref>). A recent study unraveled that OMD may be an early plasma biomarker of cardiovascular calcification (<xref ref-type="bibr" rid="B44">Skenteris et al., 2022</xref>). Furthermore, the association between OMD and cardiovascular risk factors was observed in a large aptamer-based proteomic profiling research (<xref ref-type="bibr" rid="B32">Ngo et al., 2021</xref>). Interestingly, a bioinformatics study identified OMD as the promising biomarker and therapeutic target of hypertrophic cardiomyopathy (<xref ref-type="bibr" rid="B16">Guo et al., 2021</xref>). PRELP belongs to the leucine-rich repeat (LRR) family, and encodes a leucine-rich repeat protein, which exists in ECM of connective tissues (<xref ref-type="bibr" rid="B6">Bengtsson et al., 1995</xref>). The role of PRELP in cardiac extracellular matrix remodeling has been demonstrated in proteomics research on the ischemia/reperfusion injury model (<xref ref-type="bibr" rid="B4">Barallobre-Barreiro et al., 2012</xref>). Zhang et al. recently reported that PRELP led to myocardial fibrosis and ventricular remodeling following acute myocardial infarction, which highlights the role of PRELP in cardiovascular disease (<xref ref-type="bibr" rid="B52">Zhang et al., 2022</xref>). Overall, previous studies have elucidated the pathological roles or diagnostic values of NPPA, OMD, and PRELP in different cardiovascular diseases, but have not yet involved DCM with HF.</p>
<p>To explore the common underlying mechanism of NPPA, OMD, and PRELP in DCM with HF, we performed GSEA based on KEGG gene sets. The GSEA results indicated that the KEGG pathways of NPPA, OMD, and PRELP were all enriched in the TGF-&#x3b2; signaling pathway. Thus, TGF-&#x3b2; signaling pathway might serve as a crucial mechanism in DCM with HF. Next, we analyzed the correlation between each key gene (NPPA, OMD, PRELP) and the TGF-&#x3b2; signaling pathway-related genes. INHBA, ID4, TGFB3, SMAD7, and SMAD9, the intersection of the NPPA-correlated, OMD-correlated, and PRELP-correlated genes, were considered the most likely affected genes in the TGF-&#x3b2; signaling pathway. And the up-regulation of ID4, SMAD7, and SMAD9 and down-regulation of INHBA, TGFB3 were observed in DCM with HF group. Evolving studies demonstrate that TGF-&#x3b2; signaling pathway is critically participated in HF and cardiac remodeling (<xref ref-type="bibr" rid="B10">Dobaczewski et al., 2011</xref>). Increased systemic and myocardial TGF-&#x3b2; levels were found in patients with DCM, suggesting the activation of TGF-&#x3b2; signaling pathway, which was consistent with our result (<xref ref-type="bibr" rid="B10">Dobaczewski et al., 2011</xref>). Thus, combining with the previous experimental evidence and our GSEA result, we speculated that the mediators of TGF-&#x3b2; signaling pathway may exert crucial actions through interacting with NPPA, OMD, and PRELP on the pathogenesis of DCM with HF.</p>
<p>However, there exists some shortcomings in our study. First, the five machine learning classifiers were established on small training data sets because of the limited databases of DCM with HF. Nevertheless, the best-performing classifier was comprehensively validated and then confirmed by a series of indexes. Accordingly, the selected features (key genes) were considered the most significant. Second, the up-regulation pattern of key genes (NPPA, OMD, and PRELP) needed further experimental verification, such as quantitative polymerase chain reaction or immunohistochemistry. Herein, to ensure the credibility of our analysis, external gene expression profiling and single-cell RNA seq data were used for validation. Third, combined GSEA and correlation analysis, we speculated that the TGF-&#x3b2; signaling pathway linking with NPPA, OMD, and PRELP might play a crucial role in DCM with HF. However, further functional studies are still needed to elucidate the specific roles and pathways of NPPA, OMD, and PRELP in DCM with HF.</p>
<p>In conclusion, we conducted a comprehensive bioinformatics study based on gene expression profiles and single-cell RNA sequencing datasets derived from DCM with HF patients. First, the combined analysis of WGCNA and RF classifier identified three key genes for the diagnosis of DCM with HF, out of which were NPPA, OMD, and PRELP. In addition, NPPA, OMD, and PRELP were increased in DCM with HF and showed excellent diagnostic abilities. And the up-regulated expression patterns of NPPA, OMD, and PRELP were stable, with minor fluctuation affected by differential cell states. Besides, the TGF-&#x3b2; signaling pathway, interacting with NPPA, OMD, and PRELP, may serve as a critical mechanism involvement in DCM with HF.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="s5">
<title>Data availability statement</title>
<p>Publicly available datasets were analyzed in this study. This data can be found here: Three gene expression profiling datasets of DCM with HF (GSE29819, GSE21610, GSE17800) and one single-cell RNA-sequencing dataset of DCM (GSE95140) were obtained from the GEO database (<ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/geo/">https://www.ncbi.nlm.nih.gov/geo/</ext-link>).</p>
</sec>
<sec id="s6">
<title>Ethics statement</title>
<p>Written informed consent was obtained from the individual(s) for the publication of any potentially identifiable images or data included in this article.</p>
</sec>
<sec id="s7">
<title>Author contributions</title>
<p>YHZ and YZ conceived and designed the study. YHZ and XY collected the data, performed the analyzes, and assembled the results. YHZ wrote the manuscript. YHZ and YZ edited and revised the manuscript. All authors reviewed the paper and approved the final manuscript.</p>
</sec>
<sec id="s8">
<title>Funding</title>
<p>The work is supported by grants from the National Natural Science Foundation of China 32170423 and 31501166, Chenguang Program 14CG49 from the Shanghai Education Committee, Shanghai Sailing Program of Science and Technology Commission of Shanghai Municipality 15YF1405000, and Shanghai Ocean University Fund for Science and Technology Development.</p>
</sec>
<sec sec-type="COI-statement" id="s9">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s10">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s11">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fcell.2022.1089915/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fcell.2022.1089915/full&#x23;supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="Image3.JPEG" id="SM1" mimetype="application/JPEG" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image1.JPEG" id="SM2" mimetype="application/JPEG" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image4.JPEG" id="SM3" mimetype="application/JPEG" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image7.JPEG" id="SM4" mimetype="application/JPEG" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image2.JPEG" id="SM5" mimetype="application/JPEG" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image5.JPEG" id="SM6" mimetype="application/JPEG" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="DataSheet1.DOCX" id="SM7" mimetype="application/DOCX" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image6.JPEG" id="SM8" mimetype="application/JPEG" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ai</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Pan</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Colorectal cancer prediction based on weighted gene co-expression network analysis and variational auto-encoder</article-title>. <source>Biomolecules</source> <volume>10</volume> (<issue>9</issue>), <fpage>1207</fpage>. <pub-id pub-id-type="doi">10.3390/biom10091207</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Alba</surname>
<given-names>A. C.</given-names>
</name>
<name>
<surname>Agoritsas</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Walsh</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Hanna</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Iorio</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Devereaux</surname>
<given-names>P. J.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>Discrimination and calibration of clinical prediction models: Users&#x27; guides to the medical literature</article-title>. <source>Jama</source> <volume>318</volume> (<issue>14</issue>), <fpage>1377</fpage>&#x2013;<lpage>1384</lpage>. <pub-id pub-id-type="doi">10.1001/jama.2017.12126</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ameling</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Herda</surname>
<given-names>L. R.</given-names>
</name>
<name>
<surname>Hammer</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Steil</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Teumer</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Trimpert</surname>
<given-names>C.</given-names>
</name>
<etal/>
</person-group> (<year>2013</year>). <article-title>Myocardial gene expression profiles and cardiodepressant autoantibodies predict response of patients with dilated cardiomyopathy to immunoadsorption therapy</article-title>. <source>Eur. Heart J.</source> <volume>34</volume> (<issue>9</issue>), <fpage>666</fpage>&#x2013;<lpage>675</lpage>. <pub-id pub-id-type="doi">10.1093/eurheartj/ehs330</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Barallobre-Barreiro</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Didangelos</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Schoendube</surname>
<given-names>F. A.</given-names>
</name>
<name>
<surname>Drozdov</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Yin</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Fern&#xe1;ndez-Caggiano</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>2012</year>). <article-title>Proteomics analysis of cardiac extracellular matrix remodeling in a porcine model of ischemia/reperfusion injury</article-title>. <source>Circulation</source> <volume>125</volume> (<issue>6</issue>), <fpage>789</fpage>&#x2013;<lpage>802</lpage>. <pub-id pub-id-type="doi">10.1161/circulationaha.111.056952</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Barth</surname>
<given-names>A. S.</given-names>
</name>
<name>
<surname>Kuner</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Buness</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Ruschhaupt</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Merk</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Zwermann</surname>
<given-names>L.</given-names>
</name>
<etal/>
</person-group> (<year>2006</year>). <article-title>Identification of a common gene expression signature in dilated cardiomyopathy across independent microarray studies</article-title>. <source>J. Am. Coll. Cardiol.</source> <volume>48</volume> (<issue>8</issue>), <fpage>1610</fpage>&#x2013;<lpage>1617</lpage>. <pub-id pub-id-type="doi">10.1016/j.jacc.2006.07.026</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bengtsson</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Neame</surname>
<given-names>P. J.</given-names>
</name>
<name>
<surname>Heineg&#xe5;rd</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Sommarin</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>1995</year>). <article-title>The primary structure of a basic leucine-rich repeat protein, PRELP, found in connective tissues</article-title>. <source>J. Biol. Chem.</source> <volume>270</volume> (<issue>43</issue>), <fpage>25639</fpage>&#x2013;<lpage>25644</lpage>. <pub-id pub-id-type="doi">10.1074/jbc.270.43.25639</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Carniel</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Taylor</surname>
<given-names>M. R.</given-names>
</name>
<name>
<surname>Sinagra</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Di Lenarda</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Ku</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Fain</surname>
<given-names>P. R.</given-names>
</name>
<etal/>
</person-group> (<year>2005</year>). <article-title>Alpha-myosin heavy chain: A sarcomeric gene associated with dilated and hypertrophic phenotypes of cardiomyopathy</article-title>. <source>Circulation</source> <volume>112</volume> (<issue>1</issue>), <fpage>54</fpage>&#x2013;<lpage>59</lpage>. <pub-id pub-id-type="doi">10.1161/circulationaha.104.507699</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cattaneo</surname>
<given-names>M. G.</given-names>
</name>
<name>
<surname>Pola</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Deh&#xf2;</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Sanguini</surname>
<given-names>A. M.</given-names>
</name>
<name>
<surname>Vicentini</surname>
<given-names>L. M.</given-names>
</name>
</person-group> (<year>2003</year>). <article-title>Alprostadil suppresses angiogenesis <italic>in vitro</italic> and <italic>in vivo</italic> in the murine Matrigel plug assay</article-title>. <source>Br. J. Pharmacol.</source> <volume>138</volume> (<issue>2</issue>), <fpage>377</fpage>&#x2013;<lpage>385</lpage>. <pub-id pub-id-type="doi">10.1038/sj.bjp.0705051</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Long</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Identification of crucial genes and pathways in human arrhythmogenic right ventricular cardiomyopathy by coexpression analysis</article-title>. <source>Front. Physiol.</source> <volume>9</volume>, <fpage>1778</fpage>. <pub-id pub-id-type="doi">10.3389/fphys.2018.01778</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dobaczewski</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Frangogiannis</surname>
<given-names>N. G.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Transforming growth factor (TGF)-&#x3b2; signaling in cardiac remodeling</article-title>. <source>J. Mol. Cell. Cardiol.</source> <volume>51</volume> (<issue>4</issue>), <fpage>600</fpage>&#x2013;<lpage>606</lpage>. <pub-id pub-id-type="doi">10.1016/j.yjmcc.2010.10.033</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fatkin</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>MacRae</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Sasaki</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Wolff</surname>
<given-names>M. R.</given-names>
</name>
<name>
<surname>Porcu</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Frenneaux</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>1999</year>). <article-title>Missense mutations in the rod domain of the lamin A/C gene as causes of dilated cardiomyopathy and conduction-system disease</article-title>. <source>N. Engl. J. Med.</source> <volume>341</volume> (<issue>23</issue>), <fpage>1715</fpage>&#x2013;<lpage>1724</lpage>. <pub-id pub-id-type="doi">10.1056/nejm199912023412302</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fitzgerald</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Saville</surname>
<given-names>B. R.</given-names>
</name>
<name>
<surname>Lewis</surname>
<given-names>R. J.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Decision curve analysis</article-title>. <source>Jama</source> <volume>313</volume> (<issue>4</issue>), <fpage>409</fpage>&#x2013;<lpage>410</lpage>. <pub-id pub-id-type="doi">10.1001/jama.2015.37</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gaertner</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Schwientek</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Ellinghaus</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Summer</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Golz</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Kassner</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2012</year>). <article-title>Myocardial transcriptome analysis of human arrhythmogenic right ventricular cardiomyopathy</article-title>. <source>Physiol. Genomics</source> <volume>44</volume> (<issue>1</issue>), <fpage>99</fpage>&#x2013;<lpage>109</lpage>. <pub-id pub-id-type="doi">10.1152/physiolgenomics.00094.2011</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gerull</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Gramlich</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Atherton</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>McNabb</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Trombit&#xe1;s</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Sasse-Klaassen</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2002</year>). <article-title>Mutations of TTN, encoding the giant muscle filament titin, cause familial dilated cardiomyopathy</article-title>. <source>Nat. Genet.</source> <volume>30</volume> (<issue>2</issue>), <fpage>201</fpage>&#x2013;<lpage>204</lpage>. <pub-id pub-id-type="doi">10.1038/ng815</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Goetze</surname>
<given-names>J. P.</given-names>
</name>
<name>
<surname>Bruneau</surname>
<given-names>B. G.</given-names>
</name>
<name>
<surname>Ramos</surname>
<given-names>H. R.</given-names>
</name>
<name>
<surname>Ogawa</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>de Bold</surname>
<given-names>M. K.</given-names>
</name>
<name>
<surname>de Bold</surname>
<given-names>A. J.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Cardiac natriuretic peptides</article-title>. <source>Nat. Rev. Cardiol.</source> <volume>17</volume> (<issue>11</issue>), <fpage>698</fpage>&#x2013;<lpage>717</lpage>. <pub-id pub-id-type="doi">10.1038/s41569-020-0381-0</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Guo</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Feng</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Fan</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Ou</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Osteomodulin is a potential genetic target for hypertrophic cardiomyopathy</article-title>. <source>Biochem. Genet.</source> <volume>59</volume> (<issue>5</issue>), <fpage>1185</fpage>&#x2013;<lpage>1202</lpage>. <pub-id pub-id-type="doi">10.1007/s10528-021-10050-1</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Han</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Yuan</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zheng</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Edgerton</surname>
<given-names>M. E.</given-names>
</name>
<etal/>
</person-group> (<year>2014</year>). <article-title>The Pan-Cancer analysis of pseudogene expression reveals biologically and clinically relevant tumour subtypes</article-title>. <source>Nat. Commun.</source> <volume>5</volume>, <fpage>3963</fpage>. <pub-id pub-id-type="doi">10.1038/ncomms4963</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Iwata</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Ito</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Wakabayashi</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Kitakaze</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>TRPV2 channel as a possible drug target for the treatment of heart failure</article-title>. <source>Lab. Invest.</source> <volume>100</volume> (<issue>2</issue>), <fpage>207</fpage>&#x2013;<lpage>217</lpage>. <pub-id pub-id-type="doi">10.1038/s41374-019-0349-z</pub-id>
</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Japp</surname>
<given-names>A. G.</given-names>
</name>
<name>
<surname>Gulati</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Cook</surname>
<given-names>S. A.</given-names>
</name>
<name>
<surname>Cowie</surname>
<given-names>M. R.</given-names>
</name>
<name>
<surname>Prasad</surname>
<given-names>S. K.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>The diagnosis and evaluation of dilated cardiomyopathy</article-title>. <source>J. Am. Coll. Cardiol.</source> <volume>67</volume> (<issue>25</issue>), <fpage>2996</fpage>&#x2013;<lpage>3010</lpage>. <pub-id pub-id-type="doi">10.1016/j.jacc.2016.03.590</pub-id>
</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Johnson</surname>
<given-names>J. D.</given-names>
</name>
<name>
<surname>Fugman</surname>
<given-names>D. A.</given-names>
</name>
</person-group> (<year>1983</year>). <article-title>Calcium and calmodulin antagonists binding to calmodulin and relaxation of coronary segments</article-title>. <source>J. Pharmacol. Exp. Ther.</source> <volume>226</volume> (<issue>2</issue>), <fpage>330</fpage>&#x2013;<lpage>334</lpage>.</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Karsoliya</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Approximating number of hidden layer neurons in multiple hidden layer BPNN architecture</article-title>. <source>Int. J. Eng. Trends Technol.</source> <volume>3</volume> (<issue>6</issue>), <fpage>714</fpage>&#x2013;<lpage>717</lpage>.</citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kaundal</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Kapoor</surname>
<given-names>A. S.</given-names>
</name>
<name>
<surname>Raghava</surname>
<given-names>G. P.</given-names>
</name>
</person-group> (<year>2006</year>). <article-title>Machine learning techniques in disease forecasting: A case study on rice blast prediction</article-title>. <source>BMC Bioinforma.</source> <volume>7</volume>, <fpage>485</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2105-7-485</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kuleshov</surname>
<given-names>M. V.</given-names>
</name>
<name>
<surname>Jones</surname>
<given-names>M. R.</given-names>
</name>
<name>
<surname>Rouillard</surname>
<given-names>A. D.</given-names>
</name>
<name>
<surname>Fernandez</surname>
<given-names>N. F.</given-names>
</name>
<name>
<surname>Duan</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Z.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>Enrichr: A comprehensive gene set enrichment analysis web server 2016 update</article-title>. <source>Nucleic Acids Res.</source> <volume>44</volume> (<issue>W1</issue>), <fpage>W90</fpage>&#x2013;<lpage>W97</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkw377</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Langfelder</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Horvath</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>Wgcna: an R package for weighted correlation network analysis</article-title>. <source>BMC Bioinforma.</source> <volume>9</volume>, <fpage>559</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2105-9-559</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Luo</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Pant</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Bhavnasi</surname>
<given-names>Y. K.</given-names>
</name>
<name>
<surname>Blanchard</surname>
<given-names>S. G.</given-names>
<suffix>Jr.</suffix>
</name>
<name>
<surname>Brouwer</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Pathview web: User friendly pathway visualization and data integration</article-title>. <source>Nucleic Acids Res.</source> <volume>45</volume> (<issue>W1</issue>), <fpage>W501</fpage>&#x2013;<lpage>w508</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkx372</pub-id>
</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>MacCarthy</surname>
<given-names>E. P.</given-names>
</name>
<name>
<surname>Bloomfield</surname>
<given-names>S. S.</given-names>
</name>
</person-group> (<year>1983</year>). <article-title>Labetalol: A review of its pharmacology, pharmacokinetics, clinical uses and adverse effects</article-title>. <source>Pharmacotherapy</source> <volume>3</volume> (<issue>4</issue>), <fpage>193</fpage>&#x2013;<lpage>219</lpage>. <pub-id pub-id-type="doi">10.1002/j.1875-9114.1983.tb03252.x</pub-id>
</citation>
</ref>
<ref id="B27">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Mahmaljy</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Yelamanchili</surname>
<given-names>V. S.</given-names>
</name>
<name>
<surname>Singhal</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2022</year>). &#x201c;<article-title>Dilated cardiomyopathy</article-title>,&#x201d; in <source>
<italic>StatPearls</italic>. (Treasure island (FL)</source> (<publisher-loc>Florida</publisher-loc>: <publisher-name>StatPearls Publishing</publisher-name>).</citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mazzarotto</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Tayal</surname>
<given-names>U.</given-names>
</name>
<name>
<surname>Buchan</surname>
<given-names>R. J.</given-names>
</name>
<name>
<surname>Midwinter</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Wilk</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Whiffin</surname>
<given-names>N.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Reevaluating the genetic contribution of monogenic dilated cardiomyopathy</article-title>. <source>Circulation</source> <volume>141</volume> (<issue>5</issue>), <fpage>387</fpage>&#x2013;<lpage>398</lpage>. <pub-id pub-id-type="doi">10.1161/circulationaha.119.037661</pub-id>
</citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>McDonagh</surname>
<given-names>T. A.</given-names>
</name>
<name>
<surname>Metra</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Adamo</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Gardner</surname>
<given-names>R. S.</given-names>
</name>
<name>
<surname>Baumbach</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>B&#xf6;hm</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>2021 ESC Guidelines for the diagnosis and treatment of acute and chronic heart failure: Developed by the Task Force for the diagnosis and treatment of acute and chronic heart failure of the European Society of Cardiology (ESC). With the special contribution of the Heart Failure Association (HFA) of the ESC</article-title>. <source>Eur. J. Heart Fail.</source> <volume>24</volume> (<issue>1</issue>), <fpage>4</fpage>&#x2013;<lpage>131</lpage>. <pub-id pub-id-type="doi">10.1002/ejhf.2333</pub-id>
</citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>McNally</surname>
<given-names>E. M.</given-names>
</name>
<name>
<surname>Mestroni</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Dilated cardiomyopathy: Genetic determinants and mechanisms</article-title>. <source>Circ. Res.</source> <volume>121</volume> (<issue>7</issue>), <fpage>731</fpage>&#x2013;<lpage>748</lpage>. <pub-id pub-id-type="doi">10.1161/circresaha.116.309396</pub-id>
</citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Merlo</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Pivetta</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Pinamonti</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Stolfo</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Zecchin</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Barbati</surname>
<given-names>G.</given-names>
</name>
<etal/>
</person-group> (<year>2014</year>). <article-title>Long-term prognostic impact of therapeutic strategies in patients with idiopathic dilated cardiomyopathy: Changing mortality over the last 30 years</article-title>. <source>Eur. J. Heart Fail.</source> <volume>16</volume> (<issue>3</issue>), <fpage>317</fpage>&#x2013;<lpage>324</lpage>. <pub-id pub-id-type="doi">10.1002/ejhf.16</pub-id>
</citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ngo</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Benson</surname>
<given-names>M. D.</given-names>
</name>
<name>
<surname>Long</surname>
<given-names>J. Z.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>Z. Z.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Nath</surname>
<given-names>A. K.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Proteomic profiling reveals biomarkers and pathways in type 2 diabetes risk</article-title>. <source>JCI Insight</source> <volume>6</volume> (<issue>5</issue>), <fpage>e144392</fpage>. <pub-id pub-id-type="doi">10.1172/jci.insight.144392</pub-id>
</citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nomura</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Satoh</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Fujita</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Higo</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Sumida</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Ko</surname>
<given-names>T.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Cardiomyocyte gene programs encoding morphological and functional signatures in cardiac hypertrophy and failure</article-title>. <source>Nat. Commun.</source> <volume>9</volume> (<issue>1</issue>), <fpage>4435</fpage>. <pub-id pub-id-type="doi">10.1038/s41467-018-06639-7</pub-id>
</citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Olson</surname>
<given-names>R. S.</given-names>
</name>
<name>
<surname>Cava</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Mustahsan</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Varik</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Moore</surname>
<given-names>J. H.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Data-driven advice for applying machine learning to bioinformatics problems</article-title>. <source>Pac. Symp. Biocomput.</source> <volume>23</volume>, <fpage>192</fpage>&#x2013;<lpage>203</lpage>.</citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pan</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Jin</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Hu</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Dai</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Placenta inflammation is closely associated with gestational diabetes mellitus</article-title>. <source>Am. J. Transl. Res.</source> <volume>13</volume> (<issue>5</issue>), <fpage>4068</fpage>&#x2013;<lpage>4079</lpage>.</citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ruan</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Ding</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Ye</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Kan</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Back propagation neural network model for medical expenses in patients with breast cancer</article-title>. <source>Math. Biosci. Eng.</source> <volume>18</volume> (<issue>4</issue>), <fpage>3690</fpage>&#x2013;<lpage>3698</lpage>. <pub-id pub-id-type="doi">10.3934/mbe.2021185</pub-id>
</citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sato</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Tamada</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Yu</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Okuno</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>CBNplot: Bayesian network plots for enrichment analysis</article-title>. <source>Bioinformatics</source> <volume>38</volume> (<issue>10</issue>), <fpage>2959</fpage>&#x2013;<lpage>2960</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btac175</pub-id>
</citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Schultheiss</surname>
<given-names>H. P.</given-names>
</name>
<name>
<surname>Fairweather</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Caforio</surname>
<given-names>A. L. P.</given-names>
</name>
<name>
<surname>Escher</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Hershberger</surname>
<given-names>R. E.</given-names>
</name>
<name>
<surname>Lipshultz</surname>
<given-names>S. E.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Dilated cardiomyopathy</article-title>. <source>Nat. Rev. Dis. Prim.</source> <volume>5</volume> (<issue>1</issue>), <fpage>32</fpage>. <pub-id pub-id-type="doi">10.1038/s41572-019-0084-1</pub-id>
</citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Schwientek</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Ellinghaus</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Steppan</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>D&#x27;Urso</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Seewald</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Kassner</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2010</year>). <article-title>Global gene expression analysis in nonfailing and failing myocardium pre- and postpulsatile and nonpulsatile ventricular assist device support</article-title>. <source>Physiol. Genomics</source> <volume>42</volume> (<issue>3</issue>), <fpage>397</fpage>&#x2013;<lpage>405</lpage>. <pub-id pub-id-type="doi">10.1152/physiolgenomics.00030.2010</pub-id>
</citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Schwinger</surname>
<given-names>R. H.</given-names>
</name>
<name>
<surname>B&#xf6;hm</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Erdmann</surname>
<given-names>E.</given-names>
</name>
</person-group> (<year>1992</year>). <article-title>Inotropic and lusitropic dysfunction in myocardium from patients with dilated cardiomyopathy</article-title>. <source>Am. Heart J.</source> <volume>123</volume> (<issue>1</issue>), <fpage>116</fpage>&#x2013;<lpage>128</lpage>. <pub-id pub-id-type="doi">10.1016/0002-8703(92)90755-k</pub-id>
</citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Seferovi&#x107;</surname>
<given-names>P. M.</given-names>
</name>
<name>
<surname>Polovina</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Bauersachs</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Arad</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Ben Gal</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Lund</surname>
<given-names>L. H.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Heart failure in cardiomyopathies: A position paper from the heart failure association of the European society of cardiology</article-title>. <source>Eur. J. Heart Fail.</source> <volume>21</volume> (<issue>5</issue>), <fpage>553</fpage>&#x2013;<lpage>576</lpage>. <pub-id pub-id-type="doi">10.1002/ejhf.1461</pub-id>
</citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Seidman</surname>
<given-names>J. G.</given-names>
</name>
<name>
<surname>Seidman</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2001</year>). <article-title>The genetic basis for cardiomyopathy: From mutation identification to mechanistic paradigms</article-title>. <source>Cell.</source> <volume>104</volume> (<issue>4</issue>), <fpage>557</fpage>&#x2013;<lpage>567</lpage>. <pub-id pub-id-type="doi">10.1016/s0092-8674(01)00242-2</pub-id>
</citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sheridan</surname>
<given-names>R. P.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>W. M.</given-names>
</name>
<name>
<surname>Liaw</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Ma</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Gifford</surname>
<given-names>E. M.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Extreme gradient boosting as a method for quantitative structure-activity relationships</article-title>. <source>J. Chem. Inf. Model.</source> <volume>56</volume> (<issue>12</issue>), <fpage>2353</fpage>&#x2013;<lpage>2360</lpage>. <pub-id pub-id-type="doi">10.1021/acs.jcim.6b00591</pub-id>
</citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Skenteris</surname>
<given-names>N. T.</given-names>
</name>
<name>
<surname>Seime</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Witasp</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Karl&#xf6;f</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Wasilewski</surname>
<given-names>G. B.</given-names>
</name>
<name>
<surname>Heuschkel</surname>
<given-names>M. A.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Osteomodulin attenuates smooth muscle cell osteogenic transition in vascular calcification</article-title>. <source>Clin. Transl. Med.</source> <volume>12</volume> (<issue>2</issue>), <fpage>e682</fpage>. <pub-id pub-id-type="doi">10.1002/ctm2.682</pub-id>
</citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Swedberg</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Kjekshus</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Group</surname>
<given-names>C. T. S.</given-names>
</name>
</person-group> (<year>1987</year>). <article-title>Effects of enalapril on mortality in severe congestive heart failure. Results of the cooperative north scandinavian enalapril survival study (CONSENSUS)</article-title>. <source>N. Engl. J. Med.</source> <volume>316</volume> (<issue>23</issue>), <fpage>1429</fpage>&#x2013;<lpage>1435</lpage>. <pub-id pub-id-type="doi">10.1056/nejm198706043162301</pub-id>
</citation>
</ref>
<ref id="B46">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Thompson</surname>
<given-names>S. A.</given-names>
</name>
<name>
<surname>Arden</surname>
<given-names>S. A.</given-names>
</name>
<name>
<surname>Marshall</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Wingrove</surname>
<given-names>P. B.</given-names>
</name>
<name>
<surname>Whiting</surname>
<given-names>P. J.</given-names>
</name>
<name>
<surname>Wafford</surname>
<given-names>K. A.</given-names>
</name>
</person-group> (<year>1999</year>). <article-title>Residues in transmembrane domains I and II determine gamma-aminobutyric acid type AA receptor subtype-selective antagonism by furosemide</article-title>. <source>Mol. Pharmacol.</source> <volume>55</volume> (<issue>6</issue>), <fpage>993</fpage>&#x2013;<lpage>999</lpage>. <pub-id pub-id-type="doi">10.1124/mol.55.6.993</pub-id>
</citation>
</ref>
<ref id="B47">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tian</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Lan</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Zou</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Construction and analysis of a joint diagnosis model of random forest and artificial neural network for heart failure</article-title>. <source>Aging (Albany NY)</source> <volume>12</volume> (<issue>24</issue>), <fpage>26221</fpage>&#x2013;<lpage>26235</lpage>. <pub-id pub-id-type="doi">10.18632/aging.202405</pub-id>
</citation>
</ref>
<ref id="B48">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Weintraub</surname>
<given-names>R. G.</given-names>
</name>
<name>
<surname>Semsarian</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Macdonald</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Dilated cardiomyopathy</article-title>. <source>Lancet</source> <volume>390</volume> (<issue>10092</issue>), <fpage>400</fpage>&#x2013;<lpage>414</lpage>. <pub-id pub-id-type="doi">10.1016/s0140-6736(16)31713-5</pub-id>
</citation>
</ref>
<ref id="B50">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Jin</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Zheng</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Hu</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>X.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Study of cardiovascular disease prediction model based on random forest in eastern China</article-title>. <source>Sci. Rep.</source> <volume>10</volume> (<issue>1</issue>), <fpage>5245</fpage>. <pub-id pub-id-type="doi">10.1038/s41598-020-62133-5</pub-id>
</citation>
</ref>
<ref id="B51">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Lan</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Quan</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Deng</surname>
<given-names>C.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>CellMarker: A manually curated resource of cell markers in human and mouse</article-title>. <source>Nucleic Acids Res.</source> <volume>47</volume> (<issue>D1</issue>), <fpage>D721</fpage>&#x2013;<lpage>d728</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gky900</pub-id>
</citation>
</ref>
<ref id="B52">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Fu</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Jiang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>X.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>PRELP promotes myocardial fibrosis and ventricular remodelling after acute myocardial infarction by the wnt/&#x3b2;-catenin signalling pathway</article-title>. <source>Cardiovasc. J. Afr.</source> <volume>33</volume>, <fpage>228</fpage>&#x2013;<lpage>233</lpage>. <pub-id pub-id-type="doi">10.5830/cvja-2022-001</pub-id>
</citation>
</ref>
<ref id="B53">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zheng</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Weng</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Guo</surname>
<given-names>C.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Exploring key genes to construct a diagnosis model of dilated cardiomyopathy</article-title>. <source>Front. Cardiovasc. Med.</source> <volume>9</volume>, <fpage>865096</fpage>. <pub-id pub-id-type="doi">10.3389/fcvm.2022.865096</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>